Minero Game Engine 0.0.1
Faction Warfare
Loading...
Searching...
No Matches
avx512vlintrin.h
Go to the documentation of this file.
1/* Copyright (C) 2014-2022 Free Software Foundation, Inc.
2
3 This file is part of GCC.
4
5 GCC is free software; you can redistribute it and/or modify
6 it under the terms of the GNU General Public License as published by
7 the Free Software Foundation; either version 3, or (at your option)
8 any later version.
9
10 GCC is distributed in the hope that it will be useful,
11 but WITHOUT ANY WARRANTY; without even the implied warranty of
12 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 GNU General Public License for more details.
14
15 Under Section 7 of GPL version 3, you are granted additional
16 permissions described in the GCC Runtime Library Exception, version
17 3.1, as published by the Free Software Foundation.
18
19 You should have received a copy of the GNU General Public License and
20 a copy of the GCC Runtime Library Exception along with this program;
21 see the files COPYING3 and COPYING.RUNTIME respectively. If not, see
22 <http://www.gnu.org/licenses/>. */
23
24#ifndef _IMMINTRIN_H_INCLUDED
25#error "Never use <avx512vlintrin.h> directly; include <immintrin.h> instead."
26#endif
27
28#ifndef _AVX512VLINTRIN_H_INCLUDED
29#define _AVX512VLINTRIN_H_INCLUDED
30
31#ifndef __AVX512VL__
32#pragma GCC push_options
33#pragma GCC target("avx512vl")
34#define __DISABLE_AVX512VL__
35#endif /* __AVX512VL__ */
36
37/* Internal data types for implementing the intrinsics. */
38typedef unsigned int __mmask32;
41typedef int __v8si_u __attribute__ ((__vector_size__ (32), \
43typedef long long __v2di_u __attribute__ ((__vector_size__ (16), \
45typedef long long __v4di_u __attribute__ ((__vector_size__ (32), \
47
48extern __inline __m256d
51{
53 (__v4df) __W,
54 (__mmask8) __U);
55}
56
57extern __inline __m256d
60{
62 (__v4df)
64 (__mmask8) __U);
65}
66
67extern __inline __m128d
70{
72 (__v2df) __W,
73 (__mmask8) __U);
74}
75
76extern __inline __m128d
79{
81 (__v2df)
83 (__mmask8) __U);
84}
85
86extern __inline __m256d
89{
91 (__v4df) __W,
92 (__mmask8) __U);
93}
94
95extern __inline __m256d
98{
100 (__v4df)
102 (__mmask8) __U);
103}
104
105extern __inline __m128d
108{
110 (__v2df) __W,
111 (__mmask8) __U);
112}
113
114extern __inline __m128d
116_mm_maskz_load_pd (__mmask8 __U, void const *__P)
117{
119 (__v2df)
121 (__mmask8) __U);
122}
123
124extern __inline void
127{
129 (__v4df) __A,
130 (__mmask8) __U);
131}
132
133extern __inline void
136{
138 (__v2df) __A,
139 (__mmask8) __U);
140}
141
142extern __inline __m256
145{
147 (__v8sf) __W,
148 (__mmask8) __U);
149}
150
151extern __inline __m256
154{
156 (__v8sf)
158 (__mmask8) __U);
159}
160
161extern __inline __m128
164{
166 (__v4sf) __W,
167 (__mmask8) __U);
168}
169
170extern __inline __m128
173{
175 (__v4sf)
177 (__mmask8) __U);
178}
179
180extern __inline __m256
183{
185 (__v8sf) __W,
186 (__mmask8) __U);
187}
188
189extern __inline __m256
192{
194 (__v8sf)
196 (__mmask8) __U);
197}
198
199extern __inline __m128
202{
204 (__v4sf) __W,
205 (__mmask8) __U);
206}
207
208extern __inline __m128
210_mm_maskz_load_ps (__mmask8 __U, void const *__P)
211{
213 (__v4sf)
215 (__mmask8) __U);
216}
217
218extern __inline void
221{
223 (__v8sf) __A,
224 (__mmask8) __U);
225}
226
227extern __inline void
230{
232 (__v4sf) __A,
233 (__mmask8) __U);
234}
235
236extern __inline __m256i
239{
241 (__v4di) __W,
242 (__mmask8) __U);
243}
244
245extern __inline __m256i
248{
250 (__v4di)
252 (__mmask8) __U);
253}
254
255extern __inline __m128i
258{
260 (__v2di) __W,
261 (__mmask8) __U);
262}
263
264extern __inline __m128i
267{
269 (__v2di)
271 (__mmask8) __U);
272}
273
274extern __inline __m256i
280
281extern __inline __m256i
284{
286 (__v4di) __W,
287 (__mmask8)
288 __U);
289}
290
291extern __inline __m256i
294{
296 (__v4di)
298 (__mmask8)
299 __U);
300}
301
/* Return the __v2di object that __P points to, converted to __m128i.
   The pointer is dereferenced directly through a plain __v2di *.
   NOTE(review): presumably this requires __P to satisfy the natural
   alignment of __v2di -- that typedef is not visible here; confirm.
   NOTE(review): listing line 303 is absent from this extract (the
   numbering jumps from 302 to 304); restore it from the upstream
   header before relying on this definition.  */
302extern __inline __m128i
304_mm_load_epi64 (void const *__P)
305{
306 return (__m128i) (*(__v2di *) __P);
307}
308
309extern __inline __m128i
312{
314 (__v2di) __W,
315 (__mmask8)
316 __U);
317}
318
319extern __inline __m128i
322{
324 (__v2di)
326 (__mmask8)
327 __U);
328}
329
330extern __inline void
333{
335 (__v4di) __A,
336 (__mmask8) __U);
337}
338
339extern __inline void
342{
344 (__v2di) __A,
345 (__mmask8) __U);
346}
347
348extern __inline __m256i
351{
353 (__v8si) __W,
354 (__mmask8) __U);
355}
356
357extern __inline __m256i
360{
362 (__v8si)
364 (__mmask8) __U);
365}
366
367extern __inline __m128i
370{
372 (__v4si) __W,
373 (__mmask8) __U);
374}
375
376extern __inline __m128i
379{
381 (__v4si)
383 (__mmask8) __U);
384}
385
/* Return the __v8si object that __P points to, converted to __m256i.
   The pointer is dereferenced directly through a plain __v8si *.
   NOTE(review): presumably this requires __P to satisfy the natural
   alignment of __v8si -- that typedef is not visible here; confirm.
   NOTE(review): listing line 387 is absent from this extract (the
   numbering jumps from 386 to 388); restore it from the upstream
   header before relying on this definition.  */
386extern __inline __m256i
388_mm256_load_epi32 (void const *__P)
389{
390 return (__m256i) (*(__v8si *) __P);
391}
392
393extern __inline __m256i
396{
398 (__v8si) __W,
399 (__mmask8)
400 __U);
401}
402
403extern __inline __m256i
406{
408 (__v8si)
410 (__mmask8)
411 __U);
412}
413
/* Return the __v4si object that __P points to, converted to __m128i.
   The pointer is dereferenced directly through a plain __v4si *.
   NOTE(review): presumably this requires __P to satisfy the natural
   alignment of __v4si -- that typedef is not visible here; confirm.
   NOTE(review): listing line 415 is absent from this extract (the
   numbering jumps from 414 to 416); restore it from the upstream
   header before relying on this definition.  */
414extern __inline __m128i
416_mm_load_epi32 (void const *__P)
417{
418 return (__m128i) (*(__v4si *) __P);
419}
420
421extern __inline __m128i
424{
426 (__v4si) __W,
427 (__mmask8)
428 __U);
429}
430
431extern __inline __m128i
434{
436 (__v4si)
438 (__mmask8)
439 __U);
440}
441
442extern __inline void
445{
446 *(__v8si *) __P = (__v8si) __A;
447}
448
449extern __inline void
452{
454 (__v8si) __A,
455 (__mmask8) __U);
456}
457
458extern __inline void
461{
462 *(__v4si *) __P = (__v4si) __A;
463}
464
465extern __inline void
468{
470 (__v4si) __A,
471 (__mmask8) __U);
472}
473
474extern __inline __m128d
477{
479 (__v2df) __B,
480 (__v2df) __W,
481 (__mmask8) __U);
482}
483
484extern __inline __m128d
487{
489 (__v2df) __B,
490 (__v2df)
492 (__mmask8) __U);
493}
494
495extern __inline __m256d
498 __m256d __B)
499{
501 (__v4df) __B,
502 (__v4df) __W,
503 (__mmask8) __U);
504}
505
506extern __inline __m256d
509{
511 (__v4df) __B,
512 (__v4df)
514 (__mmask8) __U);
515}
516
517extern __inline __m128
520{
522 (__v4sf) __B,
523 (__v4sf) __W,
524 (__mmask8) __U);
525}
526
527extern __inline __m128
530{
532 (__v4sf) __B,
533 (__v4sf)
535 (__mmask8) __U);
536}
537
538extern __inline __m256
541{
543 (__v8sf) __B,
544 (__v8sf) __W,
545 (__mmask8) __U);
546}
547
548extern __inline __m256
551{
553 (__v8sf) __B,
554 (__v8sf)
556 (__mmask8) __U);
557}
558
559extern __inline __m128d
562{
564 (__v2df) __B,
565 (__v2df) __W,
566 (__mmask8) __U);
567}
568
569extern __inline __m128d
572{
574 (__v2df) __B,
575 (__v2df)
577 (__mmask8) __U);
578}
579
580extern __inline __m256d
583 __m256d __B)
584{
586 (__v4df) __B,
587 (__v4df) __W,
588 (__mmask8) __U);
589}
590
591extern __inline __m256d
594{
596 (__v4df) __B,
597 (__v4df)
599 (__mmask8) __U);
600}
601
602extern __inline __m128
605{
607 (__v4sf) __B,
608 (__v4sf) __W,
609 (__mmask8) __U);
610}
611
612extern __inline __m128
615{
617 (__v4sf) __B,
618 (__v4sf)
620 (__mmask8) __U);
621}
622
623extern __inline __m256
626{
628 (__v8sf) __B,
629 (__v8sf) __W,
630 (__mmask8) __U);
631}
632
633extern __inline __m256
636{
638 (__v8sf) __B,
639 (__v8sf)
641 (__mmask8) __U);
642}
643
644extern __inline void
647{
648 *(__m256i *) __P = __A;
649}
650
651extern __inline void
654{
655 *(__m128i *) __P = __A;
656}
657
658extern __inline __m256d
661{
662 return (__m256d) __builtin_ia32_loadupd256_mask ((const double *) __P,
663 (__v4df) __W,
664 (__mmask8) __U);
665}
666
667extern __inline __m256d
670{
671 return (__m256d) __builtin_ia32_loadupd256_mask ((const double *) __P,
672 (__v4df)
674 (__mmask8) __U);
675}
676
677extern __inline __m128d
680{
681 return (__m128d) __builtin_ia32_loadupd128_mask ((const double *) __P,
682 (__v2df) __W,
683 (__mmask8) __U);
684}
685
/* Forward to __builtin_ia32_loadupd128_mask with __P viewed as
   const double *, a __v2df second argument, and __U as the __mmask8
   mask; the builtin's result is returned as __m128d.
   NOTE(review): the expression for the __v2df argument (listing line
   692) and listing line 687 are absent from this extract.  Given the
   "maskz" name the missing argument is presumably a zero vector --
   confirm against the upstream header.  */
686extern __inline __m128d
688_mm_maskz_loadu_pd (__mmask8 __U, void const *__P)
689{
690 return (__m128d) __builtin_ia32_loadupd128_mask ((const double *) __P,
691 (__v2df)
693 (__mmask8) __U);
694}
695
696extern __inline void
699{
701 (__v4df) __A,
702 (__mmask8) __U);
703}
704
705extern __inline void
708{
710 (__v2df) __A,
711 (__mmask8) __U);
712}
713
714extern __inline __m256
717{
718 return (__m256) __builtin_ia32_loadups256_mask ((const float *) __P,
719 (__v8sf) __W,
720 (__mmask8) __U);
721}
722
723extern __inline __m256
726{
727 return (__m256) __builtin_ia32_loadups256_mask ((const float *) __P,
728 (__v8sf)
730 (__mmask8) __U);
731}
732
733extern __inline __m128
736{
737 return (__m128) __builtin_ia32_loadups128_mask ((const float *) __P,
738 (__v4sf) __W,
739 (__mmask8) __U);
740}
741
/* Forward to __builtin_ia32_loadups128_mask with __P viewed as
   const float *, a __v4sf second argument, and __U as the __mmask8
   mask; the builtin's result is returned as __m128.
   NOTE(review): the expression for the __v4sf argument (listing line
   748) and listing line 743 are absent from this extract.  Given the
   "maskz" name the missing argument is presumably a zero vector --
   confirm against the upstream header.  */
742extern __inline __m128
744_mm_maskz_loadu_ps (__mmask8 __U, void const *__P)
745{
746 return (__m128) __builtin_ia32_loadups128_mask ((const float *) __P,
747 (__v4sf)
749 (__mmask8) __U);
750}
751
752extern __inline void
755{
757 (__v8sf) __A,
758 (__mmask8) __U);
759}
760
761extern __inline void
764{
766 (__v4sf) __A,
767 (__mmask8) __U);
768}
769
/* Return the __v4di_u object that __P points to, converted to
   __m256i.  The access goes through the __v4di_u typedef rather than
   plain __v4di.
   NOTE(review): __v4di_u is declared near the top of this file with
   __vector_size__ (32), but the rest of its attribute list is cut
   off in this extract; presumably it relaxes alignment/aliasing for
   unaligned loads -- confirm against the upstream header.
   NOTE(review): listing line 771 is absent from this extract.  */
770extern __inline __m256i
772_mm256_loadu_epi64 (void const *__P)
773{
774 return (__m256i) (*(__v4di_u *) __P);
775}
776
777extern __inline __m256i
780{
781 return (__m256i) __builtin_ia32_loaddqudi256_mask ((const long long *) __P,
782 (__v4di) __W,
783 (__mmask8) __U);
784}
785
786extern __inline __m256i
789{
790 return (__m256i) __builtin_ia32_loaddqudi256_mask ((const long long *) __P,
791 (__v4di)
793 (__mmask8) __U);
794}
795
/* Return the __v2di_u object that __P points to, converted to
   __m128i.  The access goes through the __v2di_u typedef rather than
   plain __v2di.
   NOTE(review): __v2di_u is declared near the top of this file with
   __vector_size__ (16), but the rest of its attribute list is cut
   off in this extract; presumably it relaxes alignment/aliasing for
   unaligned loads -- confirm against the upstream header.
   NOTE(review): listing line 797 is absent from this extract.  */
796extern __inline __m128i
798_mm_loadu_epi64 (void const *__P)
799{
800 return (__m128i) (*(__v2di_u *) __P);
801}
802
803extern __inline __m128i
806{
807 return (__m128i) __builtin_ia32_loaddqudi128_mask ((const long long *) __P,
808 (__v2di) __W,
809 (__mmask8) __U);
810}
811
812extern __inline __m128i
815{
816 return (__m128i) __builtin_ia32_loaddqudi128_mask ((const long long *) __P,
817 (__v2di)
819 (__mmask8) __U);
820}
821
822extern __inline void
825{
826 *(__m256i_u *) __P = (__m256i_u) __A;
827}
828
829extern __inline void
832{
834 (__v4di) __A,
835 (__mmask8) __U);
836}
837
838extern __inline void
841{
842 *(__m128i_u *) __P = (__m128i_u) __A;
843}
844
845extern __inline void
848{
850 (__v2di) __A,
851 (__mmask8) __U);
852}
853
/* Return the __v8si_u object that __P points to, converted to
   __m256i.  The access goes through the __v8si_u typedef rather than
   plain __v8si.
   NOTE(review): __v8si_u is declared near the top of this file with
   __vector_size__ (32), but the rest of its attribute list is cut
   off in this extract; presumably it relaxes alignment/aliasing for
   unaligned loads -- confirm against the upstream header.
   NOTE(review): listing line 855 is absent from this extract.  */
854extern __inline __m256i
856_mm256_loadu_epi32 (void const *__P)
857{
858 return (__m256i) (*(__v8si_u *) __P);
859}
860
861extern __inline __m256i
864{
865 return (__m256i) __builtin_ia32_loaddqusi256_mask ((const int *) __P,
866 (__v8si) __W,
867 (__mmask8) __U);
868}
869
870extern __inline __m256i
873{
874 return (__m256i) __builtin_ia32_loaddqusi256_mask ((const int *) __P,
875 (__v8si)
877 (__mmask8) __U);
878}
879
/* Return the __v4si_u object that __P points to, converted to
   __m128i.  The access goes through the __v4si_u typedef rather than
   plain __v4si.
   NOTE(review): the declaration of __v4si_u is not visible in this
   extract; presumably it is the unaligned/may-alias counterpart of
   __v4si -- confirm against the upstream header.
   NOTE(review): listing line 881 is absent from this extract.  */
880extern __inline __m128i
882_mm_loadu_epi32 (void const *__P)
883{
884 return (__m128i) (*(__v4si_u *) __P);
885}
886
887extern __inline __m128i
890{
891 return (__m128i) __builtin_ia32_loaddqusi128_mask ((const int *) __P,
892 (__v4si) __W,
893 (__mmask8) __U);
894}
895
896extern __inline __m128i
899{
900 return (__m128i) __builtin_ia32_loaddqusi128_mask ((const int *) __P,
901 (__v4si)
903 (__mmask8) __U);
904}
905
906extern __inline void
909{
910 *(__m256i_u *) __P = (__m256i_u) __A;
911}
912
913extern __inline void
916{
918 (__v8si) __A,
919 (__mmask8) __U);
920}
921
922extern __inline void
925{
926 *(__m128i_u *) __P = (__m128i_u) __A;
927}
928
929extern __inline void
932{
934 (__v4si) __A,
935 (__mmask8) __U);
936}
937
938extern __inline __m256i
941{
943 (__v8si) __W,
944 (__mmask8) __U);
945}
946
947extern __inline __m256i
950{
952 (__v8si)
954 (__mmask8) __U);
955}
956
957extern __inline __m128i
960{
962 (__v4si) __W,
963 (__mmask8) __U);
964}
965
966extern __inline __m128i
969{
971 (__v4si)
973 (__mmask8) __U);
974}
975
976extern __inline __m256i
979{
981 (__v4di)
983 (__mmask8) -1);
984}
985
986extern __inline __m256i
989{
991 (__v4di) __W,
992 (__mmask8) __U);
993}
994
995extern __inline __m256i
998{
1000 (__v4di)
1002 (__mmask8) __U);
1003}
1004
1005extern __inline __m128i
1008{
1010 (__v2di)
1012 (__mmask8) -1);
1013}
1014
1015extern __inline __m128i
1018{
1020 (__v2di) __W,
1021 (__mmask8) __U);
1022}
1023
1024extern __inline __m128i
1027{
1029 (__v2di)
1031 (__mmask8) __U);
1032}
1033
1034extern __inline __m128i
1037{
1039 (__v4si)
1041 (__mmask8) -1);
1042}
1043
1044extern __inline __m128i
1047{
1049 (__v4si) __W,
1050 (__mmask8) __U);
1051}
1052
1053extern __inline __m128i
1056{
1058 (__v4si)
1060 (__mmask8) __U);
1061}
1062
1063extern __inline __m128i
1066{
1068 (__v4si)
1070 (__mmask8) -1);
1071}
1072
1073extern __inline __m128i
1076{
1078 (__v4si) __W,
1079 (__mmask8) __U);
1080}
1081
1082extern __inline __m128i
1085{
1087 (__v4si)
1089 (__mmask8) __U);
1090}
1091
1092extern __inline __m256i
1095{
1097 (__v8si) __W,
1098 (__mmask8) __U);
1099}
1100
1101extern __inline __m256i
1104{
1106 (__v8si)
1108 (__mmask8) __U);
1109}
1110
1111extern __inline __m128i
1114{
1116 (__v4si) __W,
1117 (__mmask8) __U);
1118}
1119
1120extern __inline __m128i
1123{
1125 (__v4si)
1127 (__mmask8) __U);
1128}
1129
1130extern __inline __m256i
1133{
1135 (__v8si)
1137 (__mmask8) -1);
1138}
1139
1140extern __inline __m256i
1143{
1145 (__v8si) __W,
1146 (__mmask8) __U);
1147}
1148
1149extern __inline __m256i
1152{
1154 (__v8si)
1156 (__mmask8) __U);
1157}
1158
1159extern __inline __m128i
1162{
1164 (__v4si)
1166 (__mmask8) -1);
1167}
1168
1169extern __inline __m128i
1172{
1174 (__v4si) __W,
1175 (__mmask8) __U);
1176}
1177
1178extern __inline __m128i
1181{
1183 (__v4si)
1185 (__mmask8) __U);
1186}
1187
1188extern __inline __m128i
1191{
1193 (__v4si) __W,
1194 (__mmask8) __U);
1195}
1196
1197extern __inline __m128i
1200{
1202 (__v4si)
1204 (__mmask8) __U);
1205}
1206
1207extern __inline __m128i
1210{
1212 (__v4si) __W,
1213 (__mmask8) __U);
1214}
1215
1216extern __inline __m128i
1219{
1221 (__v4si)
1223 (__mmask8) __U);
1224}
1225
1226extern __inline __m128i
1229{
1231 (__v4si)
1233 (__mmask8) -1);
1234}
1235
1236extern __inline __m128i
1239{
1241 (__v4si) __W,
1242 (__mmask8) __U);
1243}
1244
1245extern __inline __m128i
1248{
1250 (__v4si)
1252 (__mmask8) __U);
1253}
1254
1255extern __inline __m128i
1258{
1260 (__v4si)
1262 (__mmask8) -1);
1263}
1264
1265extern __inline __m128i
1268{
1270 (__v4si) __W,
1271 (__mmask8) __U);
1272}
1273
1274extern __inline __m128i
1277{
1279 (__v4si)
1281 (__mmask8) __U);
1282}
1283
1284extern __inline __m128i
1287{
1289 (__v4si) __W,
1290 (__mmask8) __U);
1291}
1292
1293extern __inline __m128i
1296{
1298 (__v4si)
1300 (__mmask8) __U);
1301}
1302
1303extern __inline __m128i
1306{
1308 (__v4si) __W,
1309 (__mmask8) __U);
1310}
1311
1312extern __inline __m128i
1315{
1317 (__v4si)
1319 (__mmask8) __U);
1320}
1321
1322extern __inline __m256d
1325{
1327 (__v4df) __W,
1328 (__mmask8) __U);
1329}
1330
1331extern __inline __m256d
1334{
1336 (__v4df)
1338 (__mmask8) __U);
1339}
1340
1341extern __inline __m128d
1344{
1346 (__v2df) __W,
1347 (__mmask8) __U);
1348}
1349
1350extern __inline __m128d
1353{
1355 (__v2df)
1356 _mm_setzero_pd (),
1357 (__mmask8) __U);
1358}
1359
1360extern __inline __m256d
1363{
1365 (__v4df)
1367 (__mmask8) -1);
1368}
1369
1370extern __inline __m256d
1373{
1375 (__v4df) __W,
1376 (__mmask8) __U);
1377}
1378
1379extern __inline __m256d
1382{
1384 (__v4df)
1386 (__mmask8) __U);
1387}
1388
1389extern __inline __m128d
1392{
1394 (__v2df)
1395 _mm_setzero_pd (),
1396 (__mmask8) -1);
1397}
1398
1399extern __inline __m128d
1402{
1404 (__v2df) __W,
1405 (__mmask8) __U);
1406}
1407
1408extern __inline __m128d
1411{
1413 (__v2df)
1414 _mm_setzero_pd (),
1415 (__mmask8) __U);
1416}
1417
1418extern __inline __m256
1421{
1423 (__v8sf) __W,
1424 (__mmask8) __U);
1425}
1426
1427extern __inline __m256
1430{
1432 (__v8sf)
1434 (__mmask8) __U);
1435}
1436
1437extern __inline __m128
1440{
1442 (__v4sf) __W,
1443 (__mmask8) __U);
1444}
1445
1446extern __inline __m128
1449{
1451 (__v4sf)
1452 _mm_setzero_ps (),
1453 (__mmask8) __U);
1454}
1455
1456extern __inline __m256
1459{
1461 (__v8sf)
1463 (__mmask8) -1);
1464}
1465
1466extern __inline __m256
1469{
1471 (__v8sf) __W,
1472 (__mmask8) __U);
1473}
1474
1475extern __inline __m256
1478{
1480 (__v8sf)
1482 (__mmask8) __U);
1483}
1484
1485extern __inline __m128
1488{
1490 (__v4sf)
1491 _mm_setzero_ps (),
1492 (__mmask8) -1);
1493}
1494
1495extern __inline __m128
1498{
1500 (__v4sf) __W,
1501 (__mmask8) __U);
1502}
1503
1504extern __inline __m128
1507{
1509 (__v4sf)
1510 _mm_setzero_ps (),
1511 (__mmask8) __U);
1512}
1513
1514extern __inline __m256d
1517{
1519 (__v4df) __W,
1520 (__mmask8) __U);
1521}
1522
1523extern __inline __m256d
1526{
1528 (__v4df)
1530 (__mmask8) __U);
1531}
1532
1533extern __inline __m128d
1536{
1538 (__v2df) __W,
1539 (__mmask8) __U);
1540}
1541
1542extern __inline __m128d
1545{
1547 (__v2df)
1548 _mm_setzero_pd (),
1549 (__mmask8) __U);
1550}
1551
1552extern __inline __m128i
1555{
1557 (__v16qi)
1559 (__mmask8) -1);
1560}
1561
1562extern __inline void
1565{
1566 __builtin_ia32_pmovdb128mem_mask ((unsigned int *) __P, (__v4si) __A, __M);
1567}
1568
1569extern __inline __m128i
1572{
1574 (__v16qi) __O, __M);
1575}
1576
1577extern __inline __m128i
1580{
1582 (__v16qi)
1584 __M);
1585}
1586
1587extern __inline __m128i
1590{
1592 (__v16qi)
1594 (__mmask8) -1);
1595}
1596
1597extern __inline __m128i
1600{
1602 (__v16qi) __O, __M);
1603}
1604
1605extern __inline void
1608{
1609 __builtin_ia32_pmovdb256mem_mask ((unsigned long long *) __P, (__v8si) __A, __M);
1610}
1611
1612extern __inline __m128i
1615{
1617 (__v16qi)
1619 __M);
1620}
1621
1622extern __inline __m128i
1625{
1627 (__v16qi)
1629 (__mmask8) -1);
1630}
1631
1632extern __inline void
1635{
1636 __builtin_ia32_pmovsdb128mem_mask ((unsigned int *) __P, (__v4si) __A, __M);
1637}
1638
1639extern __inline __m128i
1642{
1644 (__v16qi) __O, __M);
1645}
1646
1647extern __inline __m128i
1650{
1652 (__v16qi)
1654 __M);
1655}
1656
1657extern __inline __m128i
1660{
1662 (__v16qi)
1664 (__mmask8) -1);
1665}
1666
1667extern __inline void
1670{
1671 __builtin_ia32_pmovsdb256mem_mask ((unsigned long long *) __P, (__v8si) __A, __M);
1672}
1673
1674extern __inline __m128i
1677{
1679 (__v16qi) __O, __M);
1680}
1681
1682extern __inline __m128i
1685{
1687 (__v16qi)
1689 __M);
1690}
1691
1692extern __inline __m128i
1695{
1697 (__v16qi)
1699 (__mmask8) -1);
1700}
1701
1702extern __inline void
1705{
1706 __builtin_ia32_pmovusdb128mem_mask ((unsigned int *) __P, (__v4si) __A, __M);
1707}
1708
1709extern __inline __m128i
1712{
1714 (__v16qi) __O,
1715 __M);
1716}
1717
1718extern __inline __m128i
1721{
1723 (__v16qi)
1725 __M);
1726}
1727
1728extern __inline __m128i
1731{
1733 (__v16qi)
1735 (__mmask8) -1);
1736}
1737
1738extern __inline void
1741{
1742 __builtin_ia32_pmovusdb256mem_mask ((unsigned long long *) __P, (__v8si) __A, __M);
1743}
1744
1745extern __inline __m128i
1748{
1750 (__v16qi) __O,
1751 __M);
1752}
1753
1754extern __inline __m128i
1757{
1759 (__v16qi)
1761 __M);
1762}
1763
1764extern __inline __m128i
1767{
1769 (__v8hi)
1771 (__mmask8) -1);
1772}
1773
1774extern __inline void
1777{
1778 __builtin_ia32_pmovdw128mem_mask ((unsigned long long *) __P, (__v4si) __A, __M);
1779}
1780
1781extern __inline __m128i
1784{
1786 (__v8hi) __O, __M);
1787}
1788
1789extern __inline __m128i
1792{
1794 (__v8hi)
1796 __M);
1797}
1798
1799extern __inline __m128i
1802{
1804 (__v8hi)
1806 (__mmask8) -1);
1807}
1808
1809extern __inline void
1812{
1814}
1815
1816extern __inline __m128i
1819{
1821 (__v8hi) __O, __M);
1822}
1823
1824extern __inline __m128i
1827{
1829 (__v8hi)
1831 __M);
1832}
1833
1834extern __inline __m128i
1837{
1839 (__v8hi)
1841 (__mmask8) -1);
1842}
1843
1844extern __inline void
1847{
1848 __builtin_ia32_pmovsdw128mem_mask ((unsigned long long *) __P, (__v4si) __A, __M);
1849}
1850
1851extern __inline __m128i
1854{
1856 (__v8hi)__O,
1857 __M);
1858}
1859
1860extern __inline __m128i
1863{
1865 (__v8hi)
1867 __M);
1868}
1869
1870extern __inline __m128i
1873{
1875 (__v8hi)
1877 (__mmask8) -1);
1878}
1879
1880extern __inline void
1883{
1885}
1886
1887extern __inline __m128i
1890{
1892 (__v8hi) __O, __M);
1893}
1894
1895extern __inline __m128i
1898{
1900 (__v8hi)
1902 __M);
1903}
1904
1905extern __inline __m128i
1908{
1910 (__v8hi)
1912 (__mmask8) -1);
1913}
1914
1915extern __inline void
1918{
1919 __builtin_ia32_pmovusdw128mem_mask ((unsigned long long *) __P, (__v4si) __A, __M);
1920}
1921
1922extern __inline __m128i
1925{
1927 (__v8hi) __O, __M);
1928}
1929
1930extern __inline __m128i
1933{
1935 (__v8hi)
1937 __M);
1938}
1939
1940extern __inline __m128i
1943{
1945 (__v8hi)
1947 (__mmask8) -1);
1948}
1949
1950extern __inline void
1953{
1955}
1956
1957extern __inline __m128i
1960{
1962 (__v8hi) __O, __M);
1963}
1964
1965extern __inline __m128i
1968{
1970 (__v8hi)
1972 __M);
1973}
1974
1975extern __inline __m128i
1978{
1980 (__v16qi)
1982 (__mmask8) -1);
1983}
1984
1985extern __inline void
1988{
1989 __builtin_ia32_pmovqb128mem_mask ((unsigned short *) __P, (__v2di) __A, __M);
1990}
1991
1992extern __inline __m128i
1995{
1997 (__v16qi) __O, __M);
1998}
1999
2000extern __inline __m128i
2003{
2005 (__v16qi)
2007 __M);
2008}
2009
2010extern __inline __m128i
2013{
2015 (__v16qi)
2017 (__mmask8) -1);
2018}
2019
2020extern __inline void
2023{
2024 __builtin_ia32_pmovqb256mem_mask ((unsigned int *) __P, (__v4di) __A, __M);
2025}
2026
2027extern __inline __m128i
2030{
2032 (__v16qi) __O, __M);
2033}
2034
2035extern __inline __m128i
2038{
2040 (__v16qi)
2042 __M);
2043}
2044
2045extern __inline __m128i
2048{
2050 (__v16qi)
2052 (__mmask8) -1);
2053}
2054
2055extern __inline void
2058{
2059 __builtin_ia32_pmovsqb128mem_mask ((unsigned short *) __P, (__v2di) __A, __M);
2060}
2061
2062extern __inline __m128i
2065{
2067 (__v16qi) __O, __M);
2068}
2069
2070extern __inline __m128i
2073{
2075 (__v16qi)
2077 __M);
2078}
2079
2080extern __inline __m128i
2083{
2085 (__v16qi)
2087 (__mmask8) -1);
2088}
2089
2090extern __inline void
2093{
2094 __builtin_ia32_pmovsqb256mem_mask ((unsigned int *) __P, (__v4di) __A, __M);
2095}
2096
2097extern __inline __m128i
2100{
2102 (__v16qi) __O, __M);
2103}
2104
2105extern __inline __m128i
2108{
2110 (__v16qi)
2112 __M);
2113}
2114
2115extern __inline __m128i
2118{
2120 (__v16qi)
2122 (__mmask8) -1);
2123}
2124
2125extern __inline void
2128{
2129 __builtin_ia32_pmovusqb128mem_mask ((unsigned short *) __P, (__v2di) __A, __M);
2130}
2131
2132extern __inline __m128i
2135{
2137 (__v16qi) __O,
2138 __M);
2139}
2140
2141extern __inline __m128i
2144{
2146 (__v16qi)
2148 __M);
2149}
2150
2151extern __inline __m128i
2154{
2156 (__v16qi)
2158 (__mmask8) -1);
2159}
2160
2161extern __inline void
2164{
2165 __builtin_ia32_pmovusqb256mem_mask ((unsigned int *) __P, (__v4di) __A, __M);
2166}
2167
2168extern __inline __m128i
2171{
2173 (__v16qi) __O,
2174 __M);
2175}
2176
2177extern __inline __m128i
2180{
2182 (__v16qi)
2184 __M);
2185}
2186
2187extern __inline __m128i
2190{
2192 (__v8hi)
2194 (__mmask8) -1);
2195}
2196
2197extern __inline void
2200{
2201 __builtin_ia32_pmovqw128mem_mask ((unsigned int *) __P, (__v2di) __A, __M);
2202}
2203
2204extern __inline __m128i
2207{
2209 (__v8hi)__O,
2210 __M);
2211}
2212
2213extern __inline __m128i
2216{
2218 (__v8hi)
2220 __M);
2221}
2222
2223extern __inline __m128i
2226{
2228 (__v8hi)
2230 (__mmask8) -1);
2231}
2232
2233extern __inline void
2236{
2237 __builtin_ia32_pmovqw256mem_mask ((unsigned long long *) __P, (__v4di) __A, __M);
2238}
2239
2240extern __inline __m128i
2243{
2245 (__v8hi) __O, __M);
2246}
2247
2248extern __inline __m128i
2251{
2253 (__v8hi)
2255 __M);
2256}
2257
2258extern __inline __m128i
2261{
2263 (__v8hi)
2265 (__mmask8) -1);
2266}
2267
2268extern __inline void
2271{
2272 __builtin_ia32_pmovsqw128mem_mask ((unsigned int *) __P, (__v2di) __A, __M);
2273}
2274
2275extern __inline __m128i
2278{
2280 (__v8hi) __O, __M);
2281}
2282
2283extern __inline __m128i
2286{
2288 (__v8hi)
2290 __M);
2291}
2292
2293extern __inline __m128i
2296{
2298 (__v8hi)
2300 (__mmask8) -1);
2301}
2302
2303extern __inline void
2306{
2307 __builtin_ia32_pmovsqw256mem_mask ((unsigned long long *) __P, (__v4di) __A, __M);
2308}
2309
2310extern __inline __m128i
2313{
2315 (__v8hi) __O, __M);
2316}
2317
2318extern __inline __m128i
2321{
2323 (__v8hi)
2325 __M);
2326}
2327
2328extern __inline __m128i
2331{
2333 (__v8hi)
2335 (__mmask8) -1);
2336}
2337
2338extern __inline void
2341{
2342 __builtin_ia32_pmovusqw128mem_mask ((unsigned int *) __P, (__v2di) __A, __M);
2343}
2344
2345extern __inline __m128i
2348{
2350 (__v8hi) __O, __M);
2351}
2352
2353extern __inline __m128i
2356{
2358 (__v8hi)
2360 __M);
2361}
2362
2363extern __inline __m128i
2366{
2368 (__v8hi)
2370 (__mmask8) -1);
2371}
2372
2373extern __inline void
2376{
2377 __builtin_ia32_pmovusqw256mem_mask ((unsigned long long *) __P, (__v4di) __A, __M);
2378}
2379
2380extern __inline __m128i
2383{
2385 (__v8hi) __O, __M);
2386}
2387
2388extern __inline __m128i
2391{
2393 (__v8hi)
2395 __M);
2396}
2397
2398extern __inline __m128i
2401{
2403 (__v4si)
2405 (__mmask8) -1);
2406}
2407
2408extern __inline void
2411{
2412 __builtin_ia32_pmovqd128mem_mask ((unsigned long long *) __P,
2413 (__v2di) __A, __M);
2414}
2415
2416extern __inline __m128i
2419{
2421 (__v4si) __O, __M);
2422}
2423
2424extern __inline __m128i
2427{
2429 (__v4si)
2431 __M);
2432}
2433
2434extern __inline __m128i
2437{
2439 (__v4si)
2441 (__mmask8) -1);
2442}
2443
2444extern __inline void
2447{
2449}
2450
2451extern __inline __m128i
2454{
2456 (__v4si) __O, __M);
2457}
2458
2459extern __inline __m128i
2462{
2464 (__v4si)
2466 __M);
2467}
2468
2469extern __inline __m128i
2472{
2474 (__v4si)
2476 (__mmask8) -1);
2477}
2478
2479extern __inline void
2482{
2483 __builtin_ia32_pmovsqd128mem_mask ((unsigned long long *) __P, (__v2di) __A, __M);
2484}
2485
2486extern __inline __m128i
2489{
2491 (__v4si) __O, __M);
2492}
2493
2494extern __inline __m128i
2497{
2499 (__v4si)
2501 __M);
2502}
2503
2504extern __inline __m128i
2507{
2509 (__v4si)
2511 (__mmask8) -1);
2512}
2513
2514extern __inline void
2517{
2519}
2520
2521extern __inline __m128i
2524{
2526 (__v4si)__O,
2527 __M);
2528}
2529
2530extern __inline __m128i
2533{
2535 (__v4si)
2537 __M);
2538}
2539
2540extern __inline __m128i
2543{
2545 (__v4si)
2547 (__mmask8) -1);
2548}
2549
2550extern __inline void
2553{
2554 __builtin_ia32_pmovusqd128mem_mask ((unsigned long long *) __P, (__v2di) __A, __M);
2555}
2556
2557extern __inline __m128i
2560{
2562 (__v4si) __O, __M);
2563}
2564
2565extern __inline __m128i
2568{
2570 (__v4si)
2572 __M);
2573}
2574
2575extern __inline __m128i
2578{
2580 (__v4si)
2582 (__mmask8) -1);
2583}
2584
2585extern __inline void
2588{
2590}
2591
2592extern __inline __m128i
2595{
2597 (__v4si) __O, __M);
2598}
2599
2600extern __inline __m128i
2603{
2605 (__v4si)
2607 __M);
2608}
2609
2610extern __inline __m256
2613{
2615 (__v8sf) __O,
2616 __M);
2617}
2618
2619extern __inline __m256
2622{
2624 (__v8sf)
2626 __M);
2627}
2628
2629extern __inline __m128
2632{
2634 (__v4sf) __O,
2635 __M);
2636}
2637
2638extern __inline __m128
2641{
2643 (__v4sf)
2644 _mm_setzero_ps (),
2645 __M);
2646}
2647
2648extern __inline __m256d
2651{
2653 (__v4df) __O,
2654 __M);
2655}
2656
2657extern __inline __m256d
2660{
2662 (__v4df)
2664 __M);
2665}
2666
2667extern __inline __m256i
2670{
2672 (__v8si) __O,
2673 __M);
2674}
2675
2676extern __inline __m256i
2679{
2681 (__v8si)
2683 __M);
2684}
2685
2686extern __inline __m256i
2689{
2691 __M);
2692}
2693
2694extern __inline __m256i
2697{
2699 (__v8si)
2701 __M);
2702}
2703
2704extern __inline __m128i
2707{
2709 (__v4si) __O,
2710 __M);
2711}
2712
2713extern __inline __m128i
2716{
2718 (__v4si)
2720 __M);
2721}
2722
2723extern __inline __m128i
2726{
2728 __M);
2729}
2730
2731extern __inline __m128i
2734{
2735 return (__m128i)
2738 __M);
2739}
2740
2741extern __inline __m256i
2744{
2746 (__v4di) __O,
2747 __M);
2748}
2749
2750extern __inline __m256i
2753{
2755 (__v4di)
2757 __M);
2758}
2759
2760extern __inline __m256i
2763{
2765 __M);
2766}
2767
2768extern __inline __m256i
2771{
2773 (__v4di)
2775 __M);
2776}
2777
2778extern __inline __m128i
2781{
2783 (__v2di) __O,
2784 __M);
2785}
2786
2787extern __inline __m128i
2790{
2792 (__v2di)
2794 __M);
2795}
2796
2797extern __inline __m128i
2800{
2802 __M);
2803}
2804
2805extern __inline __m128i
2808{
2809 return (__m128i)
2812 __M);
2813}
2814
2815extern __inline __m256
2818{
2821 (__mmask8) -1);
2822}
2823
2824extern __inline __m256
2827{
2829 (__v8sf) __O,
2830 __M);
2831}
2832
2833extern __inline __m256
2836{
2838 (__v8sf)
2840 __M);
2841}
2842
2843extern __inline __m256i
2846{
2848 __A,
2850 (__mmask8) -1);
2851}
2852
2853extern __inline __m256i
2856{
2858 __A,
2859 (__v8si)
2860 __O, __M);
2861}
2862
2863extern __inline __m256i
2866{
2868 __A,
2869 (__v8si)
2871 __M);
2872}
2873
2874extern __inline __m256i
2877{
2879 (__v8si) __W,
2880 (__mmask8) __U);
2881}
2882
2883extern __inline __m256i
2886{
2888 (__v8si)
2890 (__mmask8) __U);
2891}
2892
2893extern __inline __m128i
2896{
2898 (__v4si) __W,
2899 (__mmask8) __U);
2900}
2901
2902extern __inline __m128i
2905{
2907 (__v4si)
2909 (__mmask8) __U);
2910}
2911
2912extern __inline __m256i
2915{
2917 (__v4di) __W,
2918 (__mmask8) __U);
2919}
2920
2921extern __inline __m256i
2924{
2926 (__v4di)
2928 (__mmask8) __U);
2929}
2930
2931extern __inline __m128i
2934{
2936 (__v2di) __W,
2937 (__mmask8) __U);
2938}
2939
2940extern __inline __m128i
2943{
2945 (__v2di)
2947 (__mmask8) __U);
2948}
2949
2950extern __inline __m256i
2953{
2955 (__v8si) __W,
2956 (__mmask8) __U);
2957}
2958
2959extern __inline __m256i
2962{
2964 (__v8si)
2966 (__mmask8) __U);
2967}
2968
2969extern __inline __m128i
2972{
2974 (__v4si) __W,
2975 (__mmask8) __U);
2976}
2977
2978extern __inline __m128i
2981{
2983 (__v4si)
2985 (__mmask8) __U);
2986}
2987
2988extern __inline __m256i
2991{
2993 (__v4di) __W,
2994 (__mmask8) __U);
2995}
2996
2997extern __inline __m256i
3000{
3002 (__v4di)
3004 (__mmask8) __U);
3005}
3006
3007extern __inline __m128i
3010{
3012 (__v2di) __W,
3013 (__mmask8) __U);
3014}
3015
3016extern __inline __m128i
3019{
3021 (__v2di)
3023 (__mmask8) __U);
3024}
3025
3026extern __inline __m256i
3029{
3031 (__v4di) __W,
3032 (__mmask8) __U);
3033}
3034
3035extern __inline __m256i
3038{
3040 (__v4di)
3042 (__mmask8) __U);
3043}
3044
3045extern __inline __m128i
3048{
3050 (__v2di) __W,
3051 (__mmask8) __U);
3052}
3053
3054extern __inline __m128i
3057{
3059 (__v2di)
3061 (__mmask8) __U);
3062}
3063
3064extern __inline __m256i
3067{
3069 (__v8si) __W,
3070 (__mmask8) __U);
3071}
3072
3073extern __inline __m256i
3076{
3078 (__v8si)
3080 (__mmask8) __U);
3081}
3082
3083extern __inline __m128i
3086{
3088 (__v4si) __W,
3089 (__mmask8) __U);
3090}
3091
3092extern __inline __m128i
3095{
3097 (__v4si)
3099 (__mmask8) __U);
3100}
3101
3102extern __inline __m256i
3105{
3107 (__v4di) __W,
3108 (__mmask8) __U);
3109}
3110
3111extern __inline __m256i
3114{
3116 (__v4di)
3118 (__mmask8) __U);
3119}
3120
3121extern __inline __m128i
3124{
3126 (__v2di) __W,
3127 (__mmask8) __U);
3128}
3129
3130extern __inline __m128i
3133{
3135 (__v2di)
3137 (__mmask8) __U);
3138}
3139
3140extern __inline __m256i
3143{
3145 (__v8si) __W,
3146 (__mmask8) __U);
3147}
3148
3149extern __inline __m256i
3152{
3154 (__v8si)
3156 (__mmask8) __U);
3157}
3158
3159extern __inline __m128i
3162{
3164 (__v4si) __W,
3165 (__mmask8) __U);
3166}
3167
3168extern __inline __m128i
3171{
3173 (__v4si)
3175 (__mmask8) __U);
3176}
3177
3178extern __inline __m256i
3181{
3183 (__v4di) __W,
3184 (__mmask8) __U);
3185}
3186
3187extern __inline __m256i
3190{
3192 (__v4di)
3194 (__mmask8) __U);
3195}
3196
3197extern __inline __m128i
3200{
3202 (__v2di) __W,
3203 (__mmask8) __U);
3204}
3205
3206extern __inline __m128i
3209{
3211 (__v2di)
3213 (__mmask8) __U);
3214}
3215
3216extern __inline __m256i
3219{
3221 (__v4di) __W,
3222 (__mmask8) __U);
3223}
3224
3225extern __inline __m256i
3228{
3230 (__v4di)
3232 (__mmask8) __U);
3233}
3234
3235extern __inline __m128i
3238{
3240 (__v2di) __W,
3241 (__mmask8) __U);
3242}
3243
3244extern __inline __m128i
3247{
3249 (__v2di)
3251 (__mmask8) __U);
3252}
3253
3254extern __inline __m256d
3257{
3259 (__v4df)
3261 (__mmask8) -1);
3262}
3263
3264extern __inline __m256d
3267{
3269 (__v4df) __W,
3270 (__mmask8) __U);
3271}
3272
3273extern __inline __m256d
3276{
3278 (__v4df)
3280 (__mmask8) __U);
3281}
3282
3283extern __inline __m128d
3286{
3288 (__v2df)
3289 _mm_setzero_pd (),
3290 (__mmask8) -1);
3291}
3292
3293extern __inline __m128d
3296{
3298 (__v2df) __W,
3299 (__mmask8) __U);
3300}
3301
3302extern __inline __m128d
3305{
3307 (__v2df)
3308 _mm_setzero_pd (),
3309 (__mmask8) __U);
3310}
3311
3312extern __inline __m256
3315{
3317 (__v8sf)
3319 (__mmask8) -1);
3320}
3321
3322extern __inline __m256
3325{
3327 (__v8sf) __W,
3328 (__mmask8) __U);
3329}
3330
3331extern __inline __m256
3334{
3336 (__v8sf)
3338 (__mmask8) __U);
3339}
3340
3341extern __inline __m128
3344{
3346 (__v4sf)
3347 _mm_setzero_ps (),
3348 (__mmask8) -1);
3349}
3350
3351extern __inline __m128
3354{
3356 (__v4sf) __W,
3357 (__mmask8) __U);
3358}
3359
3360extern __inline __m128
3363{
3365 (__v4sf)
3366 _mm_setzero_ps (),
3367 (__mmask8) __U);
3368}
3369
3370extern __inline __m256d
3373{
3375 (__v4df)
3377 (__mmask8) -1);
3378}
3379
3380extern __inline __m256d
3383{
3385 (__v4df) __W,
3386 (__mmask8) __U);
3387}
3388
3389extern __inline __m256d
3392{
3394 (__v4df)
3396 (__mmask8) __U);
3397}
3398
3399extern __inline __m128d
3402{
3404 (__v2df)
3405 _mm_setzero_pd (),
3406 (__mmask8) -1);
3407}
3408
3409extern __inline __m128d
3412{
3414 (__v2df) __W,
3415 (__mmask8) __U);
3416}
3417
3418extern __inline __m128d
3421{
3423 (__v2df)
3424 _mm_setzero_pd (),
3425 (__mmask8) __U);
3426}
3427
3428extern __inline __m256
3431{
3433 (__v8sf)
3435 (__mmask8) -1);
3436}
3437
3438extern __inline __m256
3441{
3443 (__v8sf) __W,
3444 (__mmask8) __U);
3445}
3446
3447extern __inline __m256
3450{
3452 (__v8sf)
3454 (__mmask8) __U);
3455}
3456
3457extern __inline __m128
3460{
3462 (__v4sf)
3463 _mm_setzero_ps (),
3464 (__mmask8) -1);
3465}
3466
3467extern __inline __m128
3470{
3472 (__v4sf) __W,
3473 (__mmask8) __U);
3474}
3475
3476extern __inline __m128
3479{
3481 (__v4sf)
3482 _mm_setzero_ps (),
3483 (__mmask8) __U);
3484}
3485
3486extern __inline __m256d
3489{
3491 (__v4df) __W,
3492 (__mmask8) __U);
3493}
3494
3495extern __inline __m256d
3498{
3500 (__v4df)
3502 (__mmask8) __U);
3503}
3504
3505extern __inline __m128d
3508{
3510 (__v2df) __W,
3511 (__mmask8) __U);
3512}
3513
3514extern __inline __m128d
3517{
3519 (__v2df)
3520 _mm_setzero_pd (),
3521 (__mmask8) __U);
3522}
3523
3524extern __inline __m256
3527{
3529 (__v8sf) __W,
3530 (__mmask8) __U);
3531}
3532
3533extern __inline __m256
3536{
3538 (__v8sf)
3540 (__mmask8) __U);
3541}
3542
3543extern __inline __m128
3546{
3548 (__v4sf) __W,
3549 (__mmask8) __U);
3550}
3551
3552extern __inline __m128
3555{
3557 (__v4sf)
3558 _mm_setzero_ps (),
3559 (__mmask8) __U);
3560}
3561
3562extern __inline __m256i
3565 __m256i __B)
3566{
3568 (__v8si) __B,
3569 (__v8si) __W,
3570 (__mmask8) __U);
3571}
3572
3573extern __inline __m256i
3576{
3578 (__v8si) __B,
3579 (__v8si)
3581 (__mmask8) __U);
3582}
3583
3584extern __inline __m256i
3587 __m256i __B)
3588{
3590 (__v4di) __B,
3591 (__v4di) __W,
3592 (__mmask8) __U);
3593}
3594
3595extern __inline __m256i
3598{
3600 (__v4di) __B,
3601 (__v4di)
3603 (__mmask8) __U);
3604}
3605
3606extern __inline __m256i
3609 __m256i __B)
3610{
3612 (__v8si) __B,
3613 (__v8si) __W,
3614 (__mmask8) __U);
3615}
3616
3617extern __inline __m256i
3620{
3622 (__v8si) __B,
3623 (__v8si)
3625 (__mmask8) __U);
3626}
3627
3628extern __inline __m256i
3631 __m256i __B)
3632{
3634 (__v4di) __B,
3635 (__v4di) __W,
3636 (__mmask8) __U);
3637}
3638
3639extern __inline __m256i
3642{
3644 (__v4di) __B,
3645 (__v4di)
3647 (__mmask8) __U);
3648}
3649
3650extern __inline __m128i
3653 __m128i __B)
3654{
3656 (__v4si) __B,
3657 (__v4si) __W,
3658 (__mmask8) __U);
3659}
3660
3661extern __inline __m128i
3664{
3666 (__v4si) __B,
3667 (__v4si)
3669 (__mmask8) __U);
3670}
3671
3672extern __inline __m128i
3675 __m128i __B)
3676{
3678 (__v2di) __B,
3679 (__v2di) __W,
3680 (__mmask8) __U);
3681}
3682
3683extern __inline __m128i
3686{
3688 (__v2di) __B,
3689 (__v2di)
3691 (__mmask8) __U);
3692}
3693
3694extern __inline __m128i
3697 __m128i __B)
3698{
3700 (__v4si) __B,
3701 (__v4si) __W,
3702 (__mmask8) __U);
3703}
3704
3705extern __inline __m128i
3708{
3710 (__v4si) __B,
3711 (__v4si)
3713 (__mmask8) __U);
3714}
3715
3716extern __inline __m128i
3719 __m128i __B)
3720{
3722 (__v2di) __B,
3723 (__v2di) __W,
3724 (__mmask8) __U);
3725}
3726
3727extern __inline __m128i
3730{
3732 (__v2di) __B,
3733 (__v2di)
3735 (__mmask8) __U);
3736}
3737
3738extern __inline __m256
3741{
3743 (__v8sf)
3745 (__mmask8) -1);
3746}
3747
3748extern __inline __m256
3751{
3753 (__v8sf) __W,
3754 (__mmask8) __U);
3755}
3756
3757extern __inline __m256
3760{
3762 (__v8sf)
3764 (__mmask8) __U);
3765}
3766
3767extern __inline __m256d
3770{
3772 (__v4df)
3774 (__mmask8) -1);
3775}
3776
3777extern __inline __m256d
3780{
3782 (__v4df) __W,
3783 (__mmask8) __U);
3784}
3785
3786extern __inline __m256d
3789{
3791 (__v4df)
3793 (__mmask8) __U);
3794}
3795
3796extern __inline __m128
3799{
3801 (__v4sf)
3802 _mm_setzero_ps (),
3803 (__mmask8) -1);
3804}
3805
3806extern __inline __m128
3809{
3811 (__v4sf) __W,
3812 (__mmask8) __U);
3813}
3814
3815extern __inline __m128
3818{
3820 (__v4sf)
3821 _mm_setzero_ps (),
3822 (__mmask8) __U);
3823}
3824
3825extern __inline __m128d
3828{
3830 (__v2df)
3831 _mm_setzero_pd (),
3832 (__mmask8) -1);
3833}
3834
3835extern __inline __m128d
3838{
3840 (__v2df) __W,
3841 (__mmask8) __U);
3842}
3843
3844extern __inline __m128d
3847{
3849 (__v2df)
3850 _mm_setzero_pd (),
3851 (__mmask8) __U);
3852}
3853
3854extern __inline __m256i
3857 __m128i __B)
3858{
3860 (__v4si) __B,
3861 (__v8si) __W,
3862 (__mmask8) __U);
3863}
3864
3865extern __inline __m256i
3868{
3870 (__v4si) __B,
3871 (__v8si)
3873 (__mmask8) __U);
3874}
3875
3876extern __inline __m128i
3879 __m128i __B)
3880{
3882 (__v4si) __B,
3883 (__v4si) __W,
3884 (__mmask8) __U);
3885}
3886
3887extern __inline __m128i
3890{
3892 (__v4si) __B,
3893 (__v4si)
3895 (__mmask8) __U);
3896}
3897
3898extern __inline __m256i
3901 __m128i __B)
3902{
3904 (__v2di) __B,
3905 (__v4di) __W,
3906 (__mmask8) __U);
3907}
3908
3909extern __inline __m256i
3912{
3914 (__v2di) __B,
3915 (__v4di)
3917 (__mmask8) __U);
3918}
3919
3920extern __inline __m128i
3923 __m128i __B)
3924{
3926 (__v2di) __B,
3927 (__v2di) __W,
3928 (__mmask8) __U);
3929}
3930
3931extern __inline __m128i
3934{
3936 (__v2di) __B,
3937 (__v2di)
3939 (__mmask8) __U);
3940}
3941
3942extern __inline __m256i
3945 __m256i __B)
3946{
3948 (__v8si) __B,
3949 (__v8si) __W,
3950 (__mmask8) __U);
3951}
3952
3953extern __inline __m256i
3956{
3958 (__v8si) __B,
3959 (__v8si)
3961 (__mmask8) __U);
3962}
3963
3964extern __inline __m256d
3967{
3969 (__v4df) __B,
3970 (__v4df)
3972 (__mmask8) -1);
3973}
3974
3975extern __inline __m256d
3978 __m256d __B)
3979{
3981 (__v4df) __B,
3982 (__v4df) __W,
3983 (__mmask8) __U);
3984}
3985
3986extern __inline __m256d
3989{
3991 (__v4df) __B,
3992 (__v4df)
3994 (__mmask8) __U);
3995}
3996
3997extern __inline __m256
4000{
4002 (__v8sf) __B,
4003 (__v8sf)
4005 (__mmask8) -1);
4006}
4007
4008extern __inline __m256
4011 __m256 __B)
4012{
4014 (__v8sf) __B,
4015 (__v8sf) __W,
4016 (__mmask8) __U);
4017}
4018
4019extern __inline __m256
4022{
4024 (__v8sf) __B,
4025 (__v8sf)
4027 (__mmask8) __U);
4028}
4029
4030extern __inline __m128d
4033{
4035 (__v2df) __B,
4036 (__v2df)
4037 _mm_setzero_pd (),
4038 (__mmask8) -1);
4039}
4040
4041extern __inline __m128d
4044 __m128d __B)
4045{
4047 (__v2df) __B,
4048 (__v2df) __W,
4049 (__mmask8) __U);
4050}
4051
4052extern __inline __m128d
4055{
4057 (__v2df) __B,
4058 (__v2df)
4059 _mm_setzero_pd (),
4060 (__mmask8) __U);
4061}
4062
4063extern __inline __m128
4066{
4068 (__v4sf) __B,
4069 (__v4sf)
4070 _mm_setzero_ps (),
4071 (__mmask8) -1);
4072}
4073
4074extern __inline __m128
4077{
4079 (__v4sf) __B,
4080 (__v4sf) __W,
4081 (__mmask8) __U);
4082}
4083
4084extern __inline __m128
4087{
4089 (__v4sf) __B,
4090 (__v4sf)
4091 _mm_setzero_ps (),
4092 (__mmask8) __U);
4093}
4094
4095extern __inline __m256d
4099{
4101 (__v4df) __B,
4102 (__v4df) __C,
4103 (__mmask8) __U);
4104}
4105
4106extern __inline __m256d
4109 __mmask8 __U)
4110{
4112 (__v4df) __B,
4113 (__v4df) __C,
4114 (__mmask8) __U);
4115}
4116
4117extern __inline __m256d
4120 __m256d __C)
4121{
4123 (__v4df) __B,
4124 (__v4df) __C,
4125 (__mmask8) __U);
4126}
4127
4128extern __inline __m128d
4131{
4133 (__v2df) __B,
4134 (__v2df) __C,
4135 (__mmask8) __U);
4136}
4137
4138extern __inline __m128d
4141 __mmask8 __U)
4142{
4144 (__v2df) __B,
4145 (__v2df) __C,
4146 (__mmask8) __U);
4147}
4148
4149extern __inline __m128d
4152 __m128d __C)
4153{
4155 (__v2df) __B,
4156 (__v2df) __C,
4157 (__mmask8) __U);
4158}
4159
4160extern __inline __m256
4163{
4165 (__v8sf) __B,
4166 (__v8sf) __C,
4167 (__mmask8) __U);
4168}
4169
4170extern __inline __m256
4173 __mmask8 __U)
4174{
4176 (__v8sf) __B,
4177 (__v8sf) __C,
4178 (__mmask8) __U);
4179}
4180
4181extern __inline __m256
4184 __m256 __C)
4185{
4187 (__v8sf) __B,
4188 (__v8sf) __C,
4189 (__mmask8) __U);
4190}
4191
4192extern __inline __m128
4195{
4197 (__v4sf) __B,
4198 (__v4sf) __C,
4199 (__mmask8) __U);
4200}
4201
4202extern __inline __m128
4205{
4207 (__v4sf) __B,
4208 (__v4sf) __C,
4209 (__mmask8) __U);
4210}
4211
4212extern __inline __m128
4215{
4217 (__v4sf) __B,
4218 (__v4sf) __C,
4219 (__mmask8) __U);
4220}
4221
4222extern __inline __m256d
4225 __m256d __C)
4226{
4228 (__v4df) __B,
4229 (__v4df) __C,
4230 (__mmask8) __U);
4231}
4232
4233extern __inline __m256d
4236 __mmask8 __U)
4237{
4239 (__v4df) __B,
4240 (__v4df) __C,
4241 (__mmask8) __U);
4242}
4243
4244extern __inline __m256d
4247 __m256d __C)
4248{
4250 (__v4df) __B,
4251 (__v4df) __C,
4252 (__mmask8) __U);
4253}
4254
4255extern __inline __m128d
4258{
4260 (__v2df) __B,
4261 (__v2df) __C,
4262 (__mmask8) __U);
4263}
4264
4265extern __inline __m128d
4268 __mmask8 __U)
4269{
4271 (__v2df) __B,
4272 (__v2df) __C,
4273 (__mmask8) __U);
4274}
4275
4276extern __inline __m128d
4279 __m128d __C)
4280{
4282 (__v2df) __B,
4283 (__v2df) __C,
4284 (__mmask8) __U);
4285}
4286
4287extern __inline __m256
4290{
4292 (__v8sf) __B,
4293 (__v8sf) __C,
4294 (__mmask8) __U);
4295}
4296
4297extern __inline __m256
4300 __mmask8 __U)
4301{
4303 (__v8sf) __B,
4304 (__v8sf) __C,
4305 (__mmask8) __U);
4306}
4307
4308extern __inline __m256
4311 __m256 __C)
4312{
4314 (__v8sf) __B,
4315 (__v8sf) __C,
4316 (__mmask8) __U);
4317}
4318
4319extern __inline __m128
4322{
4324 (__v4sf) __B,
4325 (__v4sf) __C,
4326 (__mmask8) __U);
4327}
4328
4329extern __inline __m128
4332{
4334 (__v4sf) __B,
4335 (__v4sf) __C,
4336 (__mmask8) __U);
4337}
4338
4339extern __inline __m128
4342{
4344 (__v4sf) __B,
4345 (__v4sf) __C,
4346 (__mmask8) __U);
4347}
4348
4349extern __inline __m256d
4352 __m256d __C)
4353{
4355 (__v4df) __B,
4356 (__v4df) __C,
4357 (__mmask8) __U);
4358}
4359
4360extern __inline __m256d
4363 __mmask8 __U)
4364{
4366 (__v4df) __B,
4367 (__v4df) __C,
4368 (__mmask8)
4369 __U);
4370}
4371
4372extern __inline __m256d
4375 __m256d __C)
4376{
4378 (__v4df) __B,
4379 (__v4df) __C,
4380 (__mmask8)
4381 __U);
4382}
4383
4384extern __inline __m128d
4387 __m128d __C)
4388{
4390 (__v2df) __B,
4391 (__v2df) __C,
4392 (__mmask8) __U);
4393}
4394
4395extern __inline __m128d
4398 __mmask8 __U)
4399{
4401 (__v2df) __B,
4402 (__v2df) __C,
4403 (__mmask8)
4404 __U);
4405}
4406
4407extern __inline __m128d
4410 __m128d __C)
4411{
4413 (__v2df) __B,
4414 (__v2df) __C,
4415 (__mmask8)
4416 __U);
4417}
4418
4419extern __inline __m256
4422 __m256 __C)
4423{
4425 (__v8sf) __B,
4426 (__v8sf) __C,
4427 (__mmask8) __U);
4428}
4429
4430extern __inline __m256
4433 __mmask8 __U)
4434{
4436 (__v8sf) __B,
4437 (__v8sf) __C,
4438 (__mmask8) __U);
4439}
4440
4441extern __inline __m256
4444 __m256 __C)
4445{
4447 (__v8sf) __B,
4448 (__v8sf) __C,
4449 (__mmask8) __U);
4450}
4451
4452extern __inline __m128
4455{
4457 (__v4sf) __B,
4458 (__v4sf) __C,
4459 (__mmask8) __U);
4460}
4461
4462extern __inline __m128
4465 __mmask8 __U)
4466{
4468 (__v4sf) __B,
4469 (__v4sf) __C,
4470 (__mmask8) __U);
4471}
4472
4473extern __inline __m128
4476 __m128 __C)
4477{
4479 (__v4sf) __B,
4480 (__v4sf) __C,
4481 (__mmask8) __U);
4482}
4483
4484extern __inline __m256d
4487 __m256d __C)
4488{
4490 (__v4df) __B,
4491 -(__v4df) __C,
4492 (__mmask8) __U);
4493}
4494
4495extern __inline __m256d
4498 __mmask8 __U)
4499{
4501 (__v4df) __B,
4502 (__v4df) __C,
4503 (__mmask8)
4504 __U);
4505}
4506
4507extern __inline __m256d
4510 __m256d __C)
4511{
4513 (__v4df) __B,
4514 -(__v4df) __C,
4515 (__mmask8)
4516 __U);
4517}
4518
4519extern __inline __m128d
4522 __m128d __C)
4523{
4525 (__v2df) __B,
4526 -(__v2df) __C,
4527 (__mmask8) __U);
4528}
4529
4530extern __inline __m128d
4533 __mmask8 __U)
4534{
4536 (__v2df) __B,
4537 (__v2df) __C,
4538 (__mmask8)
4539 __U);
4540}
4541
4542extern __inline __m128d
4545 __m128d __C)
4546{
4548 (__v2df) __B,
4549 -(__v2df) __C,
4550 (__mmask8)
4551 __U);
4552}
4553
4554extern __inline __m256
4557 __m256 __C)
4558{
4560 (__v8sf) __B,
4561 -(__v8sf) __C,
4562 (__mmask8) __U);
4563}
4564
4565extern __inline __m256
4568 __mmask8 __U)
4569{
4571 (__v8sf) __B,
4572 (__v8sf) __C,
4573 (__mmask8) __U);
4574}
4575
4576extern __inline __m256
4579 __m256 __C)
4580{
4582 (__v8sf) __B,
4583 -(__v8sf) __C,
4584 (__mmask8) __U);
4585}
4586
4587extern __inline __m128
4590{
4592 (__v4sf) __B,
4593 -(__v4sf) __C,
4594 (__mmask8) __U);
4595}
4596
4597extern __inline __m128
4600 __mmask8 __U)
4601{
4603 (__v4sf) __B,
4604 (__v4sf) __C,
4605 (__mmask8) __U);
4606}
4607
4608extern __inline __m128
4611 __m128 __C)
4612{
4614 (__v4sf) __B,
4615 -(__v4sf) __C,
4616 (__mmask8) __U);
4617}
4618
4619extern __inline __m256d
4622 __m256d __C)
4623{
4625 (__v4df) __B,
4626 (__v4df) __C,
4627 (__mmask8) __U);
4628}
4629
4630extern __inline __m256d
4633 __mmask8 __U)
4634{
4636 (__v4df) __B,
4637 (__v4df) __C,
4638 (__mmask8) __U);
4639}
4640
4641extern __inline __m256d
4644 __m256d __C)
4645{
4647 (__v4df) __B,
4648 (__v4df) __C,
4649 (__mmask8) __U);
4650}
4651
4652extern __inline __m128d
4655 __m128d __C)
4656{
4658 (__v2df) __B,
4659 (__v2df) __C,
4660 (__mmask8) __U);
4661}
4662
4663extern __inline __m128d
4666 __mmask8 __U)
4667{
4669 (__v2df) __B,
4670 (__v2df) __C,
4671 (__mmask8) __U);
4672}
4673
4674extern __inline __m128d
4677 __m128d __C)
4678{
4680 (__v2df) __B,
4681 (__v2df) __C,
4682 (__mmask8) __U);
4683}
4684
4685extern __inline __m256
4688 __m256 __C)
4689{
4691 (__v8sf) __B,
4692 (__v8sf) __C,
4693 (__mmask8) __U);
4694}
4695
4696extern __inline __m256
4699 __mmask8 __U)
4700{
4702 (__v8sf) __B,
4703 (__v8sf) __C,
4704 (__mmask8) __U);
4705}
4706
4707extern __inline __m256
4710 __m256 __C)
4711{
4713 (__v8sf) __B,
4714 (__v8sf) __C,
4715 (__mmask8) __U);
4716}
4717
4718extern __inline __m128
4721{
4723 (__v4sf) __B,
4724 (__v4sf) __C,
4725 (__mmask8) __U);
4726}
4727
4728extern __inline __m128
4731{
4733 (__v4sf) __B,
4734 (__v4sf) __C,
4735 (__mmask8) __U);
4736}
4737
4738extern __inline __m128
4741{
4743 (__v4sf) __B,
4744 (__v4sf) __C,
4745 (__mmask8) __U);
4746}
4747
4748extern __inline __m256d
4751 __m256d __C)
4752{
4754 (__v4df) __B,
4755 (__v4df) __C,
4756 (__mmask8) __U);
4757}
4758
4759extern __inline __m256d
4762 __mmask8 __U)
4763{
4765 (__v4df) __B,
4766 (__v4df) __C,
4767 (__mmask8) __U);
4768}
4769
4770extern __inline __m256d
4773 __m256d __C)
4774{
4776 (__v4df) __B,
4777 (__v4df) __C,
4778 (__mmask8) __U);
4779}
4780
4781extern __inline __m128d
4784 __m128d __C)
4785{
4787 (__v2df) __B,
4788 (__v2df) __C,
4789 (__mmask8) __U);
4790}
4791
4792extern __inline __m128d
4795 __mmask8 __U)
4796{
4798 (__v2df) __B,
4799 (__v2df) __C,
4800 (__mmask8) __U);
4801}
4802
4803extern __inline __m128d
4806 __m128d __C)
4807{
4809 (__v2df) __B,
4810 (__v2df) __C,
4811 (__mmask8) __U);
4812}
4813
4814extern __inline __m256
4817 __m256 __C)
4818{
4820 (__v8sf) __B,
4821 (__v8sf) __C,
4822 (__mmask8) __U);
4823}
4824
4825extern __inline __m256
4828 __mmask8 __U)
4829{
4831 (__v8sf) __B,
4832 (__v8sf) __C,
4833 (__mmask8) __U);
4834}
4835
4836extern __inline __m256
4839 __m256 __C)
4840{
4842 (__v8sf) __B,
4843 (__v8sf) __C,
4844 (__mmask8) __U);
4845}
4846
4847extern __inline __m128
4850{
4852 (__v4sf) __B,
4853 (__v4sf) __C,
4854 (__mmask8) __U);
4855}
4856
4857extern __inline __m128
4860{
4862 (__v4sf) __B,
4863 (__v4sf) __C,
4864 (__mmask8) __U);
4865}
4866
4867extern __inline __m128
4870{
4872 (__v4sf) __B,
4873 (__v4sf) __C,
4874 (__mmask8) __U);
4875}
4876
4877extern __inline __m128i
4880 __m128i __B)
4881{
4883 (__v4si) __B,
4884 (__v4si) __W,
4885 (__mmask8) __U);
4886}
4887
4888extern __inline __m128i
4891{
4893 (__v4si) __B,
4894 (__v4si)
4896 (__mmask8) __U);
4897}
4898
4899extern __inline __m256i
4902 __m256i __B)
4903{
4905 (__v8si) __B,
4906 (__v8si) __W,
4907 (__mmask8) __U);
4908}
4909
4910extern __inline __m256i
4913{
4915 (__v8si) __B,
4916 (__v8si)
4918 (__mmask8) __U);
4919}
4920
4921extern __inline __m128i
4924 __m128i __B)
4925{
4927 (__v4si) __B,
4928 (__v4si) __W,
4929 (__mmask8) __U);
4930}
4931
4932extern __inline __m128i
4935{
4937 (__v4si) __B,
4938 (__v4si)
4940 (__mmask8) __U);
4941}
4942
4943extern __inline __m256i
4946 __m256i __B)
4947{
4949 (__v8si) __B,
4950 (__v8si) __W,
4951 (__mmask8) __U);
4952}
4953
4954extern __inline __m256i
4957{
4959 (__v8si) __B,
4960 (__v8si)
4962 (__mmask8) __U);
4963}
4964
4967{
4968 return (__m256i) ((__v8su)__A | (__v8su)__B);
4969}
4970
4971extern __inline __m128i
4974{
4976 (__v4si) __B,
4977 (__v4si) __W,
4978 (__mmask8) __U);
4979}
4980
4981extern __inline __m128i
4984{
4986 (__v4si) __B,
4987 (__v4si)
4989 (__mmask8) __U);
4990}
4991
4994{
4995 return (__m128i) ((__v4su)__A | (__v4su)__B);
4996}
4997
4998extern __inline __m256i
5001 __m256i __B)
5002{
5004 (__v8si) __B,
5005 (__v8si) __W,
5006 (__mmask8) __U);
5007}
5008
5009extern __inline __m256i
5012{
5014 (__v8si) __B,
5015 (__v8si)
5017 (__mmask8) __U);
5018}
5019
5022{
5023 return (__m256i) ((__v8su)__A ^ (__v8su)__B);
5024}
5025
5026extern __inline __m128i
5029 __m128i __B)
5030{
5032 (__v4si) __B,
5033 (__v4si) __W,
5034 (__mmask8) __U);
5035}
5036
5037extern __inline __m128i
5040{
5042 (__v4si) __B,
5043 (__v4si)
5045 (__mmask8) __U);
5046}
5047
5050{
5051 return (__m128i) ((__v4su)__A ^ (__v4su)__B);
5052}
5053
5054extern __inline __m128
5057{
5059 (__v4sf) __W,
5060 (__mmask8) __U);
5061}
5062
5063extern __inline __m128
5066{
5068 (__v4sf)
5069 _mm_setzero_ps (),
5070 (__mmask8) __U);
5071}
5072
5073extern __inline __m128
5076{
5078 (__v4sf) __W,
5079 (__mmask8) __U);
5080}
5081
5082extern __inline __m128
5085{
5087 (__v4sf)
5088 _mm_setzero_ps (),
5089 (__mmask8) __U);
5090}
5091
5092extern __inline __m256i
5095{
5097 (__v8si) __W,
5098 (__mmask8) __U);
5099}
5100
5101extern __inline __m256i
5104{
5106 (__v8si)
5108 (__mmask8) __U);
5109}
5110
5111extern __inline __m128i
5114{
5116 (__v4si) __W,
5117 (__mmask8) __U);
5118}
5119
5120extern __inline __m128i
5123{
5125 (__v4si)
5127 (__mmask8) __U);
5128}
5129
5130extern __inline __m256i
5133{
5135 (__v8si)
5137 (__mmask8) -1);
5138}
5139
5140extern __inline __m256i
5143{
5145 (__v8si) __W,
5146 (__mmask8) __U);
5147}
5148
5149extern __inline __m256i
5152{
5154 (__v8si)
5156 (__mmask8) __U);
5157}
5158
5159extern __inline __m128i
5162{
5164 (__v4si)
5166 (__mmask8) -1);
5167}
5168
5169extern __inline __m128i
5172{
5174 (__v4si) __W,
5175 (__mmask8) __U);
5176}
5177
5178extern __inline __m128i
5181{
5183 (__v4si)
5185 (__mmask8) __U);
5186}
5187
5188extern __inline __m256d
5191{
5193 (__v4df) __W,
5194 (__mmask8) __U);
5195}
5196
5197extern __inline __m256d
5200{
5202 (__v4df)
5204 (__mmask8) __U);
5205}
5206
5207extern __inline __m128d
5210{
5212 (__v2df) __W,
5213 (__mmask8) __U);
5214}
5215
5216extern __inline __m128d
5219{
5221 (__v2df)
5222 _mm_setzero_pd (),
5223 (__mmask8) __U);
5224}
5225
5226extern __inline __m256
5229{
5231 (__v8sf) __W,
5232 (__mmask8) __U);
5233}
5234
5235extern __inline __m256
5238{
5240 (__v8sf)
5242 (__mmask8) __U);
5243}
5244
5245extern __inline __m128
5248{
5250 (__v4sf) __W,
5251 (__mmask8) __U);
5252}
5253
5254extern __inline __m128
5257{
5259 (__v4sf)
5260 _mm_setzero_ps (),
5261 (__mmask8) __U);
5262}
5263
5264extern __inline __m256
5267{
5269 (__v8sf) __W,
5270 (__mmask8) __U);
5271}
5272
5273extern __inline __m256
5276{
5278 (__v8sf)
5280 (__mmask8) __U);
5281}
5282
5283extern __inline __m128
5286{
5288 (__v4sf) __W,
5289 (__mmask8) __U);
5290}
5291
5292extern __inline __m128
5295{
5297 (__v4sf)
5298 _mm_setzero_ps (),
5299 (__mmask8) __U);
5300}
5301
5302extern __inline __m128i
5305 __m128i __B)
5306{
5308 (__v4si) __B,
5309 (__v4si) __W,
5310 (__mmask8) __U);
5311}
5312
5313extern __inline __m128i
5316{
5318 (__v4si) __B,
5319 (__v4si)
5321 (__mmask8) __U);
5322}
5323
5324extern __inline __m256i
5327 __m256i __B)
5328{
5330 (__v8si) __B,
5331 (__v8si) __W,
5332 (__mmask8) __U);
5333}
5334
5335extern __inline __m256i
5338{
5340 (__v8si) __B,
5341 (__v8si)
5343 (__mmask8) __U);
5344}
5345
5346extern __inline __m128i
5349 __m128i __B)
5350{
5352 (__v2di) __B,
5353 (__v2di) __W,
5354 (__mmask8) __U);
5355}
5356
5357extern __inline __m128i
5360{
5362 (__v2di) __B,
5363 (__v2di)
5365 (__mmask8) __U);
5366}
5367
5368extern __inline __m256i
5371 __m256i __B)
5372{
5374 (__v4di) __B,
5375 (__v4di) __W,
5376 (__mmask8) __U);
5377}
5378
5379extern __inline __m256i
5382{
5384 (__v4di) __B,
5385 (__v4di)
5387 (__mmask8) __U);
5388}
5389
5390extern __inline __m128i
5393 __m128i __B)
5394{
5396 (__v4si) __B,
5397 (__v4si) __W,
5398 (__mmask8) __U);
5399}
5400
5401extern __inline __m128i
5404{
5406 (__v4si) __B,
5407 (__v4si)
5409 (__mmask8) __U);
5410}
5411
5412extern __inline __m256i
5415 __m256i __B)
5416{
5418 (__v8si) __B,
5419 (__v8si) __W,
5420 (__mmask8) __U);
5421}
5422
5423extern __inline __m256i
5426{
5428 (__v8si) __B,
5429 (__v8si)
5431 (__mmask8) __U);
5432}
5433
5434extern __inline __m128i
5437 __m128i __B)
5438{
5440 (__v2di) __B,
5441 (__v2di) __W,
5442 (__mmask8) __U);
5443}
5444
5445extern __inline __m128i
5448{
5450 (__v2di) __B,
5451 (__v2di)
5453 (__mmask8) __U);
5454}
5455
5456extern __inline __m256i
5459 __m256i __B)
5460{
5462 (__v4di) __B,
5463 (__v4di) __W,
5464 (__mmask8) __U);
5465}
5466
5467extern __inline __m256i
5470{
5472 (__v4di) __B,
5473 (__v4di)
5475 (__mmask8) __U);
5476}
5477
5478extern __inline __mmask8
5481{
5483 (__v4si) __B, 0,
5484 (__mmask8) -1);
5485}
5486
5487extern __inline __mmask8
5490{
5492 (__v4si) __B,
5493 (__mmask8) -1);
5494}
5495
5496extern __inline __mmask8
5499{
5501 (__v4si) __B, 0, __U);
5502}
5503
5504extern __inline __mmask8
5507{
5509 (__v4si) __B, __U);
5510}
5511
5512extern __inline __mmask8
5515{
5517 (__v8si) __B, 0,
5518 (__mmask8) -1);
5519}
5520
5521extern __inline __mmask8
5524{
5526 (__v8si) __B,
5527 (__mmask8) -1);
5528}
5529
5530extern __inline __mmask8
5533{
5535 (__v8si) __B, 0, __U);
5536}
5537
5538extern __inline __mmask8
5541{
5543 (__v8si) __B, __U);
5544}
5545
5546extern __inline __mmask8
5549{
5551 (__v2di) __B, 0,
5552 (__mmask8) -1);
5553}
5554
5555extern __inline __mmask8
5558{
5560 (__v2di) __B,
5561 (__mmask8) -1);
5562}
5563
5564extern __inline __mmask8
5567{
5569 (__v2di) __B, 0, __U);
5570}
5571
5572extern __inline __mmask8
5575{
5577 (__v2di) __B, __U);
5578}
5579
5580extern __inline __mmask8
5583{
5585 (__v4di) __B, 0,
5586 (__mmask8) -1);
5587}
5588
5589extern __inline __mmask8
5592{
5594 (__v4di) __B,
5595 (__mmask8) -1);
5596}
5597
5598extern __inline __mmask8
5601{
5603 (__v4di) __B, 0, __U);
5604}
5605
5606extern __inline __mmask8
5609{
5611 (__v4di) __B, __U);
5612}
5613
5614extern __inline __mmask8
5617{
5619 (__v4si) __B, 6,
5620 (__mmask8) -1);
5621}
5622
5623extern __inline __mmask8
5626{
5628 (__v4si) __B,
5629 (__mmask8) -1);
5630}
5631
5632extern __inline __mmask8
5635{
5637 (__v4si) __B, 6, __U);
5638}
5639
5640extern __inline __mmask8
5643{
5645 (__v4si) __B, __U);
5646}
5647
5648extern __inline __mmask8
5651{
5653 (__v8si) __B, 6,
5654 (__mmask8) -1);
5655}
5656
5657extern __inline __mmask8
5660{
5662 (__v8si) __B,
5663 (__mmask8) -1);
5664}
5665
5666extern __inline __mmask8
5669{
5671 (__v8si) __B, 6, __U);
5672}
5673
5674extern __inline __mmask8
5677{
5679 (__v8si) __B, __U);
5680}
5681
5682extern __inline __mmask8
5685{
5687 (__v2di) __B, 6,
5688 (__mmask8) -1);
5689}
5690
5691extern __inline __mmask8
5694{
5696 (__v2di) __B,
5697 (__mmask8) -1);
5698}
5699
5700extern __inline __mmask8
5703{
5705 (__v2di) __B, 6, __U);
5706}
5707
5708extern __inline __mmask8
5711{
5713 (__v2di) __B, __U);
5714}
5715
5716extern __inline __mmask8
5719{
5721 (__v4di) __B, 6,
5722 (__mmask8) -1);
5723}
5724
5725extern __inline __mmask8
5728{
5730 (__v4di) __B,
5731 (__mmask8) -1);
5732}
5733
5734extern __inline __mmask8
5737{
5739 (__v4di) __B, 6, __U);
5740}
5741
5742extern __inline __mmask8
5745{
5747 (__v4di) __B, __U);
5748}
5749
5750extern __inline __mmask8
5753{
5755 (__v4si) __B,
5756 (__mmask8) -1);
5757}
5758
5759extern __inline __mmask8
5762{
5764 (__v4si) __B, __U);
5765}
5766
5767extern __inline __mmask8
5770{
5772 (__v8si) __B,
5773 (__mmask8) -1);
5774}
5775
5776extern __inline __mmask8
5779{
5781 (__v8si) __B, __U);
5782}
5783
5784extern __inline __mmask8
5787{
5789 (__v2di) __B,
5790 (__mmask8) -1);
5791}
5792
5793extern __inline __mmask8
5796{
5798 (__v2di) __B, __U);
5799}
5800
5801extern __inline __mmask8
5804{
5806 (__v4di) __B,
5807 (__mmask8) -1);
5808}
5809
5810extern __inline __mmask8
5813{
5815 (__v4di) __B, __U);
5816}
5817
5818extern __inline __mmask8
5821{
5823 (__v4si) __B,
5824 (__mmask8) -1);
5825}
5826
5827extern __inline __mmask8
5830{
5832 (__v4si) __B, __U);
5833}
5834
5835extern __inline __mmask8
5838{
5840 (__v8si) __B,
5841 (__mmask8) -1);
5842}
5843
5844extern __inline __mmask8
5847{
5849 (__v8si) __B, __U);
5850}
5851
5852extern __inline __mmask8
5855{
5857 (__v2di) __B,
5858 (__mmask8) -1);
5859}
5860
5861extern __inline __mmask8
5864{
5866 (__v2di) __B, __U);
5867}
5868
5869extern __inline __mmask8
5872{
5874 (__v4di) __B,
5875 (__mmask8) -1);
5876}
5877
5878extern __inline __mmask8
5881{
5883 (__v4di) __B, __U);
5884}
5885
5886extern __inline __m256d
5889{
5891 (__v4df) __W,
5892 (__mmask8) __U);
5893}
5894
5895extern __inline __m256d
5898{
5900 (__v4df)
5902 (__mmask8) __U);
5903}
5904
5905extern __inline void
5908{
5910 (__v4df) __A,
5911 (__mmask8) __U);
5912}
5913
5914extern __inline __m128d
5917{
5919 (__v2df) __W,
5920 (__mmask8) __U);
5921}
5922
5923extern __inline __m128d
5926{
5928 (__v2df)
5929 _mm_setzero_pd (),
5930 (__mmask8) __U);
5931}
5932
5933extern __inline void
5936{
5938 (__v2df) __A,
5939 (__mmask8) __U);
5940}
5941
5942extern __inline __m256
5945{
5947 (__v8sf) __W,
5948 (__mmask8) __U);
5949}
5950
5951extern __inline __m256
5954{
5956 (__v8sf)
5958 (__mmask8) __U);
5959}
5960
5961extern __inline void
5964{
5966 (__v8sf) __A,
5967 (__mmask8) __U);
5968}
5969
5970extern __inline __m128
5973{
5975 (__v4sf) __W,
5976 (__mmask8) __U);
5977}
5978
5979extern __inline __m128
5982{
5984 (__v4sf)
5985 _mm_setzero_ps (),
5986 (__mmask8) __U);
5987}
5988
5989extern __inline void
5992{
5994 (__v4sf) __A,
5995 (__mmask8) __U);
5996}
5997
5998extern __inline __m256i
6001{
6003 (__v4di) __W,
6004 (__mmask8) __U);
6005}
6006
6007extern __inline __m256i
6010{
6012 (__v4di)
6014 (__mmask8) __U);
6015}
6016
6017extern __inline void
6020{
6022 (__v4di) __A,
6023 (__mmask8) __U);
6024}
6025
6026extern __inline __m128i
6029{
6031 (__v2di) __W,
6032 (__mmask8) __U);
6033}
6034
6035extern __inline __m128i
6038{
6040 (__v2di)
6042 (__mmask8) __U);
6043}
6044
6045extern __inline void
6048{
6050 (__v2di) __A,
6051 (__mmask8) __U);
6052}
6053
6054extern __inline __m256i
6057{
6059 (__v8si) __W,
6060 (__mmask8) __U);
6061}
6062
6063extern __inline __m256i
6066{
6068 (__v8si)
6070 (__mmask8) __U);
6071}
6072
6073extern __inline void
6076{
6078 (__v8si) __A,
6079 (__mmask8) __U);
6080}
6081
6082extern __inline __m128i
6085{
6087 (__v4si) __W,
6088 (__mmask8) __U);
6089}
6090
6091extern __inline __m128i
6094{
6096 (__v4si)
6098 (__mmask8) __U);
6099}
6100
6101extern __inline void
6104{
6106 (__v4si) __A,
6107 (__mmask8) __U);
6108}
6109
6110extern __inline __m256d
6113{
6115 (__v4df) __W,
6116 (__mmask8) __U);
6117}
6118
6119extern __inline __m256d
6122{
6124 (__v4df)
6126 (__mmask8) __U);
6127}
6128
6129extern __inline __m256d
6132{
6134 (__v4df) __W,
6135 (__mmask8)
6136 __U);
6137}
6138
6139extern __inline __m256d
6142{
6144 (__v4df)
6146 (__mmask8)
6147 __U);
6148}
6149
6150extern __inline __m128d
6153{
6155 (__v2df) __W,
6156 (__mmask8) __U);
6157}
6158
6159extern __inline __m128d
6162{
6164 (__v2df)
6165 _mm_setzero_pd (),
6166 (__mmask8) __U);
6167}
6168
6169extern __inline __m128d
6172{
6174 (__v2df) __W,
6175 (__mmask8)
6176 __U);
6177}
6178
6179extern __inline __m128d
6182{
6184 (__v2df)
6185 _mm_setzero_pd (),
6186 (__mmask8)
6187 __U);
6188}
6189
6190extern __inline __m256
6193{
6195 (__v8sf) __W,
6196 (__mmask8) __U);
6197}
6198
6199extern __inline __m256
6202{
6204 (__v8sf)
6206 (__mmask8) __U);
6207}
6208
6209extern __inline __m256
6212{
6214 (__v8sf) __W,
6215 (__mmask8) __U);
6216}
6217
6218extern __inline __m256
6221{
6223 (__v8sf)
6225 (__mmask8)
6226 __U);
6227}
6228
6229extern __inline __m128
6232{
6234 (__v4sf) __W,
6235 (__mmask8) __U);
6236}
6237
6238extern __inline __m128
6241{
6243 (__v4sf)
6244 _mm_setzero_ps (),
6245 (__mmask8) __U);
6246}
6247
6248extern __inline __m128
6251{
6253 (__v4sf) __W,
6254 (__mmask8) __U);
6255}
6256
6257extern __inline __m128
6260{
6262 (__v4sf)
6263 _mm_setzero_ps (),
6264 (__mmask8)
6265 __U);
6266}
6267
6268extern __inline __m256i
6271{
6273 (__v4di) __W,
6274 (__mmask8) __U);
6275}
6276
6277extern __inline __m256i
6280{
6282 (__v4di)
6284 (__mmask8) __U);
6285}
6286
6287extern __inline __m256i
6290 void const *__P)
6291{
6293 (__v4di) __W,
6294 (__mmask8)
6295 __U);
6296}
6297
6298extern __inline __m256i
6301{
6303 (__v4di)
6305 (__mmask8)
6306 __U);
6307}
6308
6309extern __inline __m128i
6312{
6314 (__v2di) __W,
6315 (__mmask8) __U);
6316}
6317
6318extern __inline __m128i
6321{
6323 (__v2di)
6325 (__mmask8) __U);
6326}
6327
6328extern __inline __m128i
6331{
6333 (__v2di) __W,
6334 (__mmask8)
6335 __U);
6336}
6337
6338extern __inline __m128i
6341{
6343 (__v2di)
6345 (__mmask8)
6346 __U);
6347}
6348
6349extern __inline __m256i
6352{
6354 (__v8si) __W,
6355 (__mmask8) __U);
6356}
6357
6358extern __inline __m256i
6361{
6363 (__v8si)
6365 (__mmask8) __U);
6366}
6367
6368extern __inline __m256i
6371 void const *__P)
6372{
6374 (__v8si) __W,
6375 (__mmask8)
6376 __U);
6377}
6378
6379extern __inline __m256i
6382{
6384 (__v8si)
6386 (__mmask8)
6387 __U);
6388}
6389
6390extern __inline __m128i
6393{
6395 (__v4si) __W,
6396 (__mmask8) __U);
6397}
6398
6399extern __inline __m128i
6402{
6404 (__v4si)
6406 (__mmask8) __U);
6407}
6408
6409extern __inline __m128i
6412{
6414 (__v4si) __W,
6415 (__mmask8)
6416 __U);
6417}
6418
6419extern __inline __m128i
6422{
6424 (__v4si)
6426 (__mmask8)
6427 __U);
6428}
6429
6430extern __inline __m256d
6433{
6435 /* idx */ ,
6436 (__v4df) __A,
6437 (__v4df) __B,
6438 (__mmask8) -1);
6439}
6440
6441extern __inline __m256d
6444 __m256d __B)
6445{
6447 /* idx */ ,
6448 (__v4df) __A,
6449 (__v4df) __B,
6450 (__mmask8)
6451 __U);
6452}
6453
6454extern __inline __m256d
6457 __m256d __B)
6458{
6460 (__v4di) __I
6461 /* idx */ ,
6462 (__v4df) __B,
6463 (__mmask8)
6464 __U);
6465}
6466
6467extern __inline __m256d
6470 __m256d __B)
6471{
6473 /* idx */ ,
6474 (__v4df) __A,
6475 (__v4df) __B,
6476 (__mmask8)
6477 __U);
6478}
6479
6480extern __inline __m256
6483{
6485 /* idx */ ,
6486 (__v8sf) __A,
6487 (__v8sf) __B,
6488 (__mmask8) -1);
6489}
6490
6491extern __inline __m256
6494 __m256 __B)
6495{
6497 /* idx */ ,
6498 (__v8sf) __A,
6499 (__v8sf) __B,
6500 (__mmask8) __U);
6501}
6502
6503extern __inline __m256
6506 __m256 __B)
6507{
6509 (__v8si) __I
6510 /* idx */ ,
6511 (__v8sf) __B,
6512 (__mmask8) __U);
6513}
6514
6515extern __inline __m256
6518 __m256 __B)
6519{
6521 /* idx */ ,
6522 (__v8sf) __A,
6523 (__v8sf) __B,
6524 (__mmask8)
6525 __U);
6526}
6527
6528extern __inline __m128i
6531{
6533 /* idx */ ,
6534 (__v2di) __A,
6535 (__v2di) __B,
6536 (__mmask8) -1);
6537}
6538
6539extern __inline __m128i
6542 __m128i __B)
6543{
6545 /* idx */ ,
6546 (__v2di) __A,
6547 (__v2di) __B,
6548 (__mmask8) __U);
6549}
6550
6551extern __inline __m128i
6554 __m128i __B)
6555{
6557 (__v2di) __I
6558 /* idx */ ,
6559 (__v2di) __B,
6560 (__mmask8) __U);
6561}
6562
6563extern __inline __m128i
6566 __m128i __B)
6567{
6569 /* idx */ ,
6570 (__v2di) __A,
6571 (__v2di) __B,
6572 (__mmask8)
6573 __U);
6574}
6575
6576extern __inline __m128i
6579{
6581 /* idx */ ,
6582 (__v4si) __A,
6583 (__v4si) __B,
6584 (__mmask8) -1);
6585}
6586
6587extern __inline __m128i
6590 __m128i __B)
6591{
6593 /* idx */ ,
6594 (__v4si) __A,
6595 (__v4si) __B,
6596 (__mmask8) __U);
6597}
6598
6599extern __inline __m128i
6602 __m128i __B)
6603{
6605 (__v4si) __I
6606 /* idx */ ,
6607 (__v4si) __B,
6608 (__mmask8) __U);
6609}
6610
6611extern __inline __m128i
6614 __m128i __B)
6615{
6617 /* idx */ ,
6618 (__v4si) __A,
6619 (__v4si) __B,
6620 (__mmask8)
6621 __U);
6622}
6623
6624extern __inline __m256i
6627{
6629 /* idx */ ,
6630 (__v4di) __A,
6631 (__v4di) __B,
6632 (__mmask8) -1);
6633}
6634
6635extern __inline __m256i
6638 __m256i __B)
6639{
6641 /* idx */ ,
6642 (__v4di) __A,
6643 (__v4di) __B,
6644 (__mmask8) __U);
6645}
6646
6647extern __inline __m256i
6651{
6653 (__v4di) __I
6654 /* idx */ ,
6655 (__v4di) __B,
6656 (__mmask8) __U);
6657}
6658
6659extern __inline __m256i
6663{
6665 /* idx */ ,
6666 (__v4di) __A,
6667 (__v4di) __B,
6668 (__mmask8)
6669 __U);
6670}
6671
6672extern __inline __m256i
6675{
6677 /* idx */ ,
6678 (__v8si) __A,
6679 (__v8si) __B,
6680 (__mmask8) -1);
6681}
6682
6683extern __inline __m256i
6686 __m256i __B)
6687{
6689 /* idx */ ,
6690 (__v8si) __A,
6691 (__v8si) __B,
6692 (__mmask8) __U);
6693}
6694
6695extern __inline __m256i
6699{
6701 (__v8si) __I
6702 /* idx */ ,
6703 (__v8si) __B,
6704 (__mmask8) __U);
6705}
6706
6707extern __inline __m256i
6711{
6713 /* idx */ ,
6714 (__v8si) __A,
6715 (__v8si) __B,
6716 (__mmask8)
6717 __U);
6718}
6719
6720extern __inline __m128d
6723{
6725 /* idx */ ,
6726 (__v2df) __A,
6727 (__v2df) __B,
6728 (__mmask8) -1);
6729}
6730
6731extern __inline __m128d
6734 __m128d __B)
6735{
6737 /* idx */ ,
6738 (__v2df) __A,
6739 (__v2df) __B,
6740 (__mmask8)
6741 __U);
6742}
6743
6744extern __inline __m128d
6747 __m128d __B)
6748{
6750 (__v2di) __I
6751 /* idx */ ,
6752 (__v2df) __B,
6753 (__mmask8)
6754 __U);
6755}
6756
6757extern __inline __m128d
6760 __m128d __B)
6761{
6763 /* idx */ ,
6764 (__v2df) __A,
6765 (__v2df) __B,
6766 (__mmask8)
6767 __U);
6768}
6769
6770extern __inline __m128
6773{
6775 /* idx */ ,
6776 (__v4sf) __A,
6777 (__v4sf) __B,
6778 (__mmask8) -1);
6779}
6780
6781extern __inline __m128
6784 __m128 __B)
6785{
6787 /* idx */ ,
6788 (__v4sf) __A,
6789 (__v4sf) __B,
6790 (__mmask8) __U);
6791}
6792
6793extern __inline __m128
6796 __m128 __B)
6797{
6799 (__v4si) __I
6800 /* idx */ ,
6801 (__v4sf) __B,
6802 (__mmask8) __U);
6803}
6804
6805extern __inline __m128
6808 __m128 __B)
6809{
6811 /* idx */ ,
6812 (__v4sf) __A,
6813 (__v4sf) __B,
6814 (__mmask8)
6815 __U);
6816}
6817
6818extern __inline __m128i
6821{
6823 (__v2di) __Y,
6824 (__v2di)
6826 (__mmask8) -1);
6827}
6828
6829extern __inline __m128i
6832 __m128i __Y)
6833{
6835 (__v2di) __Y,
6836 (__v2di) __W,
6837 (__mmask8) __U);
6838}
6839
6840extern __inline __m128i
6843{
6845 (__v2di) __Y,
6846 (__v2di)
6848 (__mmask8) __U);
6849}
6850
6851extern __inline __m256i
6854 __m256i __Y)
6855{
6857 (__v8si) __Y,
6858 (__v8si) __W,
6859 (__mmask8) __U);
6860}
6861
6862extern __inline __m256i
6865{
6867 (__v8si) __Y,
6868 (__v8si)
6870 (__mmask8) __U);
6871}
6872
6873extern __inline __m128i
6876 __m128i __Y)
6877{
6879 (__v4si) __Y,
6880 (__v4si) __W,
6881 (__mmask8) __U);
6882}
6883
6884extern __inline __m128i
6887{
6889 (__v4si) __Y,
6890 (__v4si)
6892 (__mmask8) __U);
6893}
6894
6895extern __inline __m256i
6898 __m256i __Y)
6899{
6901 (__v4di) __Y,
6902 (__v4di) __W,
6903 (__mmask8) __U);
6904}
6905
6906extern __inline __m256i
6909{
6911 (__v4di) __Y,
6912 (__v4di)
6914 (__mmask8) __U);
6915}
6916
6917extern __inline __m128i
6920 __m128i __Y)
6921{
6923 (__v2di) __Y,
6924 (__v2di) __W,
6925 (__mmask8) __U);
6926}
6927
6928extern __inline __m128i
6931{
6933 (__v2di) __Y,
6934 (__v2di)
6936 (__mmask8) __U);
6937}
6938
6939extern __inline __m256i
6942 __m256i __Y)
6943{
6945 (__v8si) __Y,
6946 (__v8si) __W,
6947 (__mmask8) __U);
6948}
6949
6950extern __inline __m256i
6953{
6955 (__v8si) __Y,
6956 (__v8si)
6958 (__mmask8) __U);
6959}
6960
6961extern __inline __m128i
6964 __m128i __Y)
6965{
6967 (__v4si) __Y,
6968 (__v4si) __W,
6969 (__mmask8) __U);
6970}
6971
6972extern __inline __m128i
6975{
6977 (__v4si) __Y,
6978 (__v4si)
6980 (__mmask8) __U);
6981}
6982
6983extern __inline __m256i
6986 __m256i __Y)
6987{
6989 (__v8si) __Y,
6990 (__v8si) __W,
6991 (__mmask8) __U);
6992}
6993
6994extern __inline __m256i
6997{
6999 (__v8si) __Y,
7000 (__v8si)
7002 (__mmask8) __U);
7003}
7004
7005extern __inline __m128i
7008 __m128i __Y)
7009{
7011 (__v4si) __Y,
7012 (__v4si) __W,
7013 (__mmask8) __U);
7014}
7015
7016extern __inline __m128i
7019{
7021 (__v4si) __Y,
7022 (__v4si)
7024 (__mmask8) __U);
7025}
7026
7027extern __inline __m256i
7030 __m256i __Y)
7031{
7033 (__v4di) __Y,
7034 (__v4di) __W,
7035 (__mmask8) __U);
7036}
7037
7038extern __inline __m256i
7041{
7043 (__v4di) __Y,
7044 (__v4di)
7046 (__mmask8) __U);
7047}
7048
7049extern __inline __m128i
7052 __m128i __Y)
7053{
7055 (__v2di) __Y,
7056 (__v2di) __W,
7057 (__mmask8) __U);
7058}
7059
7060extern __inline __m128i
7063{
7065 (__v2di) __Y,
7066 (__v2di)
7068 (__mmask8) __U);
7069}
7070
7071extern __inline __m256i
7074{
7076 (__v8si) __B,
7077 (__v8si)
7079 (__mmask8) -1);
7080}
7081
7082extern __inline __m256i
7085 __m256i __B)
7086{
7088 (__v8si) __B,
7089 (__v8si) __W,
7090 (__mmask8) __U);
7091}
7092
7093extern __inline __m256i
7096{
7098 (__v8si) __B,
7099 (__v8si)
7101 (__mmask8) __U);
7102}
7103
7104extern __inline __m128i
7107{
7109 (__v4si) __B,
7110 (__v4si)
7112 (__mmask8) -1);
7113}
7114
7115extern __inline __m128i
7118 __m128i __B)
7119{
7121 (__v4si) __B,
7122 (__v4si) __W,
7123 (__mmask8) __U);
7124}
7125
7126extern __inline __m128i
7129{
7131 (__v4si) __B,
7132 (__v4si)
7134 (__mmask8) __U);
7135}
7136
7137extern __inline __m256i
7140{
7142 (__v8si) __B,
7143 (__v8si)
7145 (__mmask8) -1);
7146}
7147
7148extern __inline __m256i
7151 __m256i __B)
7152{
7154 (__v8si) __B,
7155 (__v8si) __W,
7156 (__mmask8) __U);
7157}
7158
7159extern __inline __m256i
7162{
7164 (__v8si) __B,
7165 (__v8si)
7167 (__mmask8) __U);
7168}
7169
7170extern __inline __m128i
7173{
7175 (__v4si) __B,
7176 (__v4si)
7178 (__mmask8) -1);
7179}
7180
7181extern __inline __m128i
7184 __m128i __B)
7185{
7187 (__v4si) __B,
7188 (__v4si) __W,
7189 (__mmask8) __U);
7190}
7191
7192extern __inline __m128i
7195{
7197 (__v4si) __B,
7198 (__v4si)
7200 (__mmask8) __U);
7201}
7202
7203extern __inline __m256i
7206{
7208 (__v4di) __B,
7209 (__v4di)
7211 (__mmask8) -1);
7212}
7213
7214extern __inline __m256i
7217 __m256i __B)
7218{
7220 (__v4di) __B,
7221 (__v4di) __W,
7222 (__mmask8) __U);
7223}
7224
7225extern __inline __m256i
7228{
7230 (__v4di) __B,
7231 (__v4di)
7233 (__mmask8) __U);
7234}
7235
7236extern __inline __m128i
7239{
7241 (__v2di) __B,
7242 (__v2di)
7244 (__mmask8) -1);
7245}
7246
7247extern __inline __m128i
7250 __m128i __B)
7251{
7253 (__v2di) __B,
7254 (__v2di) __W,
7255 (__mmask8) __U);
7256}
7257
7258extern __inline __m128i
7261{
7263 (__v2di) __B,
7264 (__v2di)
7266 (__mmask8) __U);
7267}
7268
7269extern __inline __m256i
7272{
7274 (__v4di) __B,
7275 (__v4di)
7277 (__mmask8) -1);
7278}
7279
7280extern __inline __m256i
7283 __m256i __B)
7284{
7286 (__v4di) __B,
7287 (__v4di) __W,
7288 (__mmask8) __U);
7289}
7290
7291extern __inline __m256i
7294{
7296 (__v4di) __B,
7297 (__v4di)
7299 (__mmask8) __U);
7300}
7301
7302extern __inline __m128i
7305{
7307 (__v2di) __B,
7308 (__v2di)
7310 (__mmask8) -1);
7311}
7312
7313extern __inline __m128i
7316 __m128i __B)
7317{
7319 (__v2di) __B,
7320 (__v2di) __W,
7321 (__mmask8) __U);
7322}
7323
7324extern __inline __m128i
7327{
7329 (__v2di) __B,
7330 (__v2di)
7332 (__mmask8) __U);
7333}
7334
7335extern __inline __m256i
7338{
7340 (__v4di) __Y,
7341 (__v4di)
7343 (__mmask8) -1);
7344}
7345
7346extern __inline __m256i
7349 __m256i __Y)
7350{
7352 (__v4di) __Y,
7353 (__v4di) __W,
7354 (__mmask8) __U);
7355}
7356
7357extern __inline __m256i
7360{
7362 (__v4di) __Y,
7363 (__v4di)
7365 (__mmask8) __U);
7366}
7367
7368extern __inline __m256i
7371 __m256i __B)
7372{
7374 (__v4di) __B,
7375 (__v4di) __W, __U);
7376}
7377
7378extern __inline __m256i
7381{
7383 (__v4di) __B,
7384 (__v4di)
7386 __U);
7387}
7388
7389extern __inline __m128i
7392 __m128i __B)
7393{
7395 (__v2di) __B,
7396 (__v2di) __W, __U);
7397}
7398
7399extern __inline __m128i
7402{
7404 (__v2di) __B,
7405 (__v2di)
7406 _mm_setzero_pd (),
7407 __U);
7408}
7409
7410extern __inline __m256i
7413 __m256i __B)
7414{
7416 (__v4di) __B,
7417 (__v4di) __W, __U);
7418}
7419
7420extern __inline __m256i
7423{
7425 (__v4di) __B,
7426 (__v4di)
7428 __U);
7429}
7430
7431extern __inline __m128i
7434 __m128i __B)
7435{
7437 (__v2di) __B,
7438 (__v2di) __W, __U);
7439}
7440
7441extern __inline __m128i
7444{
7446 (__v2di) __B,
7447 (__v2di)
7448 _mm_setzero_pd (),
7449 __U);
7450}
7451
7452extern __inline __m256i
7455 __m256i __B)
7456{
7458 (__v4di) __B,
7459 (__v4di) __W,
7460 (__mmask8) __U);
7461}
7462
7463extern __inline __m256i
7466{
7468 (__v4di) __B,
7469 (__v4di)
7471 (__mmask8) __U);
7472}
7473
7476{
7477 return (__m256i) ((__v4du)__A | (__v4du)__B);
7478}
7479
7480extern __inline __m128i
7483{
7485 (__v2di) __B,
7486 (__v2di) __W,
7487 (__mmask8) __U);
7488}
7489
7490extern __inline __m128i
7493{
7495 (__v2di) __B,
7496 (__v2di)
7498 (__mmask8) __U);
7499}
7500
7503{
7504 return (__m128i) ((__v2du)__A | (__v2du)__B);
7505}
7506
7507extern __inline __m256i
7510 __m256i __B)
7511{
7513 (__v4di) __B,
7514 (__v4di) __W,
7515 (__mmask8) __U);
7516}
7517
7518extern __inline __m256i
7521{
7523 (__v4di) __B,
7524 (__v4di)
7526 (__mmask8) __U);
7527}
7528
7531{
7532 return (__m256i) ((__v4du)__A ^ (__v4du)__B);
7533}
7534
7535extern __inline __m128i
7538 __m128i __B)
7539{
7541 (__v2di) __B,
7542 (__v2di) __W,
7543 (__mmask8) __U);
7544}
7545
7546extern __inline __m128i
7549{
7551 (__v2di) __B,
7552 (__v2di)
7554 (__mmask8) __U);
7555}
7556
7559{
7560 return (__m128i) ((__v2du)__A ^ (__v2du)__B);
7561}
7562
7563extern __inline __m256d
7566 __m256d __B)
7567{
7569 (__v4df) __B,
7570 (__v4df) __W,
7571 (__mmask8) __U);
7572}
7573
7574extern __inline __m256d
7577{
7579 (__v4df) __B,
7580 (__v4df)
7582 (__mmask8) __U);
7583}
7584
7585extern __inline __m256
7588{
7590 (__v8sf) __B,
7591 (__v8sf) __W,
7592 (__mmask8) __U);
7593}
7594
7595extern __inline __m256
7598{
7600 (__v8sf) __B,
7601 (__v8sf)
7603 (__mmask8) __U);
7604}
7605
7606extern __inline __m128
7609{
7611 (__v4sf) __B,
7612 (__v4sf) __W,
7613 (__mmask8) __U);
7614}
7615
7616extern __inline __m128
7619{
7621 (__v4sf) __B,
7622 (__v4sf)
7623 _mm_setzero_ps (),
7624 (__mmask8) __U);
7625}
7626
7627extern __inline __m128d
7630{
7632 (__v2df) __B,
7633 (__v2df) __W,
7634 (__mmask8) __U);
7635}
7636
7637extern __inline __m128d
7640{
7642 (__v2df) __B,
7643 (__v2df)
7644 _mm_setzero_pd (),
7645 (__mmask8) __U);
7646}
7647
7648extern __inline __m256d
7651 __m256d __B)
7652{
7654 (__v4df) __B,
7655 (__v4df) __W,
7656 (__mmask8) __U);
7657}
7658
7659extern __inline __m256d
7662 __m256d __B)
7663{
7665 (__v4df) __B,
7666 (__v4df) __W,
7667 (__mmask8) __U);
7668}
7669
7670extern __inline __m256d
7673{
7675 (__v4df) __B,
7676 (__v4df)
7678 (__mmask8) __U);
7679}
7680
7681extern __inline __m256
7684{
7686 (__v8sf) __B,
7687 (__v8sf) __W,
7688 (__mmask8) __U);
7689}
7690
7691extern __inline __m256d
7694{
7696 (__v4df) __B,
7697 (__v4df)
7699 (__mmask8) __U);
7700}
7701
7702extern __inline __m256
7705{
7707 (__v8sf) __B,
7708 (__v8sf) __W,
7709 (__mmask8) __U);
7710}
7711
7712extern __inline __m256
7715{
7717 (__v8sf) __B,
7718 (__v8sf)
7720 (__mmask8) __U);
7721}
7722
7723extern __inline __m256
7726{
7728 (__v8sf) __B,
7729 (__v8sf)
7731 (__mmask8) __U);
7732}
7733
7734extern __inline __m128
7737{
7739 (__v4sf) __B,
7740 (__v4sf) __W,
7741 (__mmask8) __U);
7742}
7743
7744extern __inline __m128
7747{
7749 (__v4sf) __B,
7750 (__v4sf) __W,
7751 (__mmask8) __U);
7752}
7753
7754extern __inline __m128
7757{
7759 (__v4sf) __B,
7760 (__v4sf)
7761 _mm_setzero_ps (),
7762 (__mmask8) __U);
7763}
7764
7765extern __inline __m128
7768{
7770 (__v4sf) __B,
7771 (__v4sf)
7772 _mm_setzero_ps (),
7773 (__mmask8) __U);
7774}
7775
7776extern __inline __m128
7779{
7781 (__v4sf) __B,
7782 (__v4sf) __W,
7783 (__mmask8) __U);
7784}
7785
7786extern __inline __m128
7789{
7791 (__v4sf) __B,
7792 (__v4sf)
7793 _mm_setzero_ps (),
7794 (__mmask8) __U);
7795}
7796
7797extern __inline __m128d
7800{
7802 (__v2df) __B,
7803 (__v2df) __W,
7804 (__mmask8) __U);
7805}
7806
7807extern __inline __m128d
7810{
7812 (__v2df) __B,
7813 (__v2df)
7814 _mm_setzero_pd (),
7815 (__mmask8) __U);
7816}
7817
7818extern __inline __m128d
7821{
7823 (__v2df) __B,
7824 (__v2df) __W,
7825 (__mmask8) __U);
7826}
7827
7828extern __inline __m128d
7831{
7833 (__v2df) __B,
7834 (__v2df)
7835 _mm_setzero_pd (),
7836 (__mmask8) __U);
7837}
7838
7839extern __inline __m128d
7842{
7844 (__v2df) __B,
7845 (__v2df) __W,
7846 (__mmask8) __U);
7847}
7848
7849extern __inline __m128d
7852{
7854 (__v2df) __B,
7855 (__v2df)
7856 _mm_setzero_pd (),
7857 (__mmask8) __U);
7858}
7859
7860extern __inline __m256
7863{
7865 (__v8sf) __B,
7866 (__v8sf) __W,
7867 (__mmask8) __U);
7868}
7869
7870extern __inline __m256
7873{
7875 (__v8sf) __B,
7876 (__v8sf)
7878 (__mmask8) __U);
7879}
7880
7881extern __inline __m256d
7884 __m256d __B)
7885{
7887 (__v4df) __B,
7888 (__v4df) __W,
7889 (__mmask8) __U);
7890}
7891
7892extern __inline __m256d
7895{
7897 (__v4df) __B,
7898 (__v4df)
7900 (__mmask8) __U);
7901}
7902
7903extern __inline __m256i
7906{
7908 (__v4di) __B,
7909 (__v4di)
7911 __M);
7912}
7913
7914extern __inline __m256i
7917 __m256i __B)
7918{
7920 (__v4di) __B,
7921 (__v4di) __W, __M);
7922}
7923
7924extern __inline __m256i
7927{
7929 (__v4di) __B,
7930 (__v4di)
7932 (__mmask8) -1);
7933}
7934
7935extern __inline __m256i
7938 __m256i __B)
7939{
7941 (__v4di) __B,
7942 (__v4di) __W, __M);
7943}
7944
7945extern __inline __m256i
7948{
7950 (__v4di) __B,
7951 (__v4di)
7953 __M);
7954}
7955
7956extern __inline __m256i
7959{
7961 (__v4di) __B,
7962 (__v4di)
7964 __M);
7965}
7966
7967extern __inline __m256i
7970{
7972 (__v4di) __B,
7973 (__v4di)
7975 (__mmask8) -1);
7976}
7977
7978extern __inline __m256i
7981{
7983 (__v4di) __B,
7984 (__v4di)
7986 (__mmask8) -1);
7987}
7988
7989extern __inline __m256i
7992 __m256i __B)
7993{
7995 (__v4di) __B,
7996 (__v4di) __W, __M);
7997}
7998
7999extern __inline __m256i
8002{
8004 (__v4di) __B,
8005 (__v4di)
8007 (__mmask8) -1);
8008}
8009
8010extern __inline __m256i
8013 __m256i __B)
8014{
8016 (__v4di) __B,
8017 (__v4di) __W, __M);
8018}
8019
8020extern __inline __m256i
8023{
8025 (__v4di) __B,
8026 (__v4di)
8028 __M);
8029}
8030
8031extern __inline __m256i
8034{
8036 (__v8si) __B,
8037 (__v8si)
8039 __M);
8040}
8041
8042extern __inline __m256i
8045 __m256i __B)
8046{
8048 (__v8si) __B,
8049 (__v8si) __W, __M);
8050}
8051
8052extern __inline __m256i
8055{
8057 (__v8si) __B,
8058 (__v8si)
8060 __M);
8061}
8062
8063extern __inline __m256i
8066 __m256i __B)
8067{
8069 (__v8si) __B,
8070 (__v8si) __W, __M);
8071}
8072
8073extern __inline __m256i
8076{
8078 (__v8si) __B,
8079 (__v8si)
8081 __M);
8082}
8083
8084extern __inline __m256i
8087 __m256i __B)
8088{
8090 (__v8si) __B,
8091 (__v8si) __W, __M);
8092}
8093
8094extern __inline __m256i
8097{
8099 (__v8si) __B,
8100 (__v8si)
8102 __M);
8103}
8104
8105extern __inline __m256i
8108 __m256i __B)
8109{
8111 (__v8si) __B,
8112 (__v8si) __W, __M);
8113}
8114
8115extern __inline __m128i
8118{
8120 (__v2di) __B,
8121 (__v2di)
8123 __M);
8124}
8125
8126extern __inline __m128i
8129 __m128i __B)
8130{
8132 (__v2di) __B,
8133 (__v2di) __W, __M);
8134}
8135
8136extern __inline __m128i
8139{
8141 (__v2di) __B,
8142 (__v2di)
8144 (__mmask8) -1);
8145}
8146
8147extern __inline __m128i
8150 __m128i __B)
8151{
8153 (__v2di) __B,
8154 (__v2di) __W, __M);
8155}
8156
8157extern __inline __m128i
8160{
8162 (__v2di) __B,
8163 (__v2di)
8165 __M);
8166}
8167
8168extern __inline __m128i
8171{
8173 (__v2di) __B,
8174 (__v2di)
8176 __M);
8177}
8178
8179extern __inline __m128i
8182{
8184 (__v2di) __B,
8185 (__v2di)
8187 (__mmask8) -1);
8188}
8189
8190extern __inline __m128i
8193{
8195 (__v2di) __B,
8196 (__v2di)
8198 (__mmask8) -1);
8199}
8200
8201extern __inline __m128i
8204 __m128i __B)
8205{
8207 (__v2di) __B,
8208 (__v2di) __W, __M);
8209}
8210
8211extern __inline __m128i
8214{
8216 (__v2di) __B,
8217 (__v2di)
8219 (__mmask8) -1);
8220}
8221
8222extern __inline __m128i
8225 __m128i __B)
8226{
8228 (__v2di) __B,
8229 (__v2di) __W, __M);
8230}
8231
8232extern __inline __m128i
8235{
8237 (__v2di) __B,
8238 (__v2di)
8240 __M);
8241}
8242
8243extern __inline __m128i
8246{
8248 (__v4si) __B,
8249 (__v4si)
8251 __M);
8252}
8253
8254extern __inline __m128i
8257 __m128i __B)
8258{
8260 (__v4si) __B,
8261 (__v4si) __W, __M);
8262}
8263
8264extern __inline __m128i
8267{
8269 (__v4si) __B,
8270 (__v4si)
8272 __M);
8273}
8274
8275extern __inline __m128i
8278 __m128i __B)
8279{
8281 (__v4si) __B,
8282 (__v4si) __W, __M);
8283}
8284
8285extern __inline __m128i
8288{
8290 (__v4si) __B,
8291 (__v4si)
8293 __M);
8294}
8295
8296extern __inline __m128i
8299 __m128i __B)
8300{
8302 (__v4si) __B,
8303 (__v4si) __W, __M);
8304}
8305
8306extern __inline __m128i
8309{
8311 (__v4si) __B,
8312 (__v4si)
8314 __M);
8315}
8316
8317extern __inline __m128i
8320 __m128i __B)
8321{
8323 (__v4si) __B,
8324 (__v4si) __W, __M);
8325}
8326
8327#ifndef __AVX512CD__
8328#pragma GCC push_options
8329#pragma GCC target("avx512vl,avx512cd")
8330#define __DISABLE_AVX512VLCD__
8331#endif
8332
8333extern __inline __m128i
8336{
8338}
8339
8340extern __inline __m256i
8343{
8345}
8346
8347extern __inline __m128i
8350{
8352}
8353
8354extern __inline __m256i
8357{
8359}
8360
8361extern __inline __m256i
8364{
8366 (__v8si)
8368 (__mmask8) -1);
8369}
8370
8371extern __inline __m256i
8374{
8376 (__v8si) __W,
8377 (__mmask8) __U);
8378}
8379
8380extern __inline __m256i
8383{
8385 (__v8si)
8387 (__mmask8) __U);
8388}
8389
8390extern __inline __m256i
8393{
8395 (__v4di)
8397 (__mmask8) -1);
8398}
8399
8400extern __inline __m256i
8403{
8405 (__v4di) __W,
8406 (__mmask8) __U);
8407}
8408
8409extern __inline __m256i
8412{
8414 (__v4di)
8416 (__mmask8) __U);
8417}
8418
8419extern __inline __m256i
8422{
8424 (__v4di)
8426 (__mmask8) -1);
8427}
8428
8429extern __inline __m256i
8432{
8434 (__v4di) __W,
8435 (__mmask8)
8436 __U);
8437}
8438
8439extern __inline __m256i
8442{
8444 (__v4di)
8446 (__mmask8)
8447 __U);
8448}
8449
8450extern __inline __m256i
8453{
8455 (__v8si)
8457 (__mmask8) -1);
8458}
8459
8460extern __inline __m256i
8463{
8465 (__v8si) __W,
8466 (__mmask8)
8467 __U);
8468}
8469
8470extern __inline __m256i
8473{
8475 (__v8si)
8477 (__mmask8)
8478 __U);
8479}
8480
8481extern __inline __m128i
8484{
8486 (__v4si)
8488 (__mmask8) -1);
8489}
8490
8491extern __inline __m128i
8494{
8496 (__v4si) __W,
8497 (__mmask8) __U);
8498}
8499
8500extern __inline __m128i
8503{
8505 (__v4si)
8507 (__mmask8) __U);
8508}
8509
8510extern __inline __m128i
8513{
8515 (__v2di)
8517 (__mmask8) -1);
8518}
8519
8520extern __inline __m128i
8523{
8525 (__v2di) __W,
8526 (__mmask8) __U);
8527}
8528
8529extern __inline __m128i
8532{
8534 (__v2di)
8536 (__mmask8) __U);
8537}
8538
8539extern __inline __m128i
8542{
8544 (__v2di)
8546 (__mmask8) -1);
8547}
8548
8549extern __inline __m128i
8552{
8554 (__v2di) __W,
8555 (__mmask8)
8556 __U);
8557}
8558
8559extern __inline __m128i
8562{
8564 (__v2di)
8566 (__mmask8)
8567 __U);
8568}
8569
8570extern __inline __m128i
8573{
8575 (__v4si)
8577 (__mmask8) -1);
8578}
8579
8580extern __inline __m128i
8583{
8585 (__v4si) __W,
8586 (__mmask8)
8587 __U);
8588}
8589
8590extern __inline __m128i
8593{
8595 (__v4si)
8597 (__mmask8)
8598 __U);
8599}
8600
8601#ifdef __DISABLE_AVX512VLCD__
8602#pragma GCC pop_options
8603#endif
8604
8605extern __inline __m256d
8608 __m256d __B)
8609{
8611 (__v4df) __B,
8612 (__v4df) __W,
8613 (__mmask8) __U);
8614}
8615
8616extern __inline __m256d
8619{
8621 (__v4df) __B,
8622 (__v4df)
8624 (__mmask8) __U);
8625}
8626
8627extern __inline __m128d
8630 __m128d __B)
8631{
8633 (__v2df) __B,
8634 (__v2df) __W,
8635 (__mmask8) __U);
8636}
8637
8638extern __inline __m128d
8641{
8643 (__v2df) __B,
8644 (__v2df)
8645 _mm_setzero_pd (),
8646 (__mmask8) __U);
8647}
8648
8649extern __inline __m256
8652 __m256 __B)
8653{
8655 (__v8sf) __B,
8656 (__v8sf) __W,
8657 (__mmask8) __U);
8658}
8659
8660extern __inline __m256d
8663 __m256d __B)
8664{
8666 (__v4df) __B,
8667 (__v4df) __W,
8668 (__mmask8) __U);
8669}
8670
8671extern __inline __m256d
8674{
8676 (__v4df) __B,
8677 (__v4df)
8679 (__mmask8) __U);
8680}
8681
8682extern __inline __m128d
8685 __m128d __B)
8686{
8688 (__v2df) __B,
8689 (__v2df) __W,
8690 (__mmask8) __U);
8691}
8692
8693extern __inline __m128d
8696{
8698 (__v2df) __B,
8699 (__v2df)
8700 _mm_setzero_pd (),
8701 (__mmask8) __U);
8702}
8703
8704extern __inline __m256
8707 __m256 __B)
8708{
8710 (__v8sf) __B,
8711 (__v8sf) __W,
8712 (__mmask8) __U);
8713}
8714
8715extern __inline __m256
8718{
8720 (__v8sf) __B,
8721 (__v8sf)
8723 (__mmask8) __U);
8724}
8725
8726extern __inline __m128
8729{
8731 (__v4sf) __B,
8732 (__v4sf) __W,
8733 (__mmask8) __U);
8734}
8735
8736extern __inline __m128
8739{
8741 (__v4sf) __B,
8742 (__v4sf)
8743 _mm_setzero_ps (),
8744 (__mmask8) __U);
8745}
8746
8747extern __inline __m128
8750{
8752 (__v4sf) __W,
8753 (__mmask8) __U);
8754}
8755
8756extern __inline __m128
8759{
8761 (__v4sf)
8762 _mm_setzero_ps (),
8763 (__mmask8) __U);
8764}
8765
8766extern __inline __m256
8769{
8771 (__v8sf) __B,
8772 (__v8sf)
8774 (__mmask8) __U);
8775}
8776
8777extern __inline __m256
8780{
8782 (__v8sf) __W,
8783 (__mmask8) __U);
8784}
8785
8786extern __inline __m256
8789{
8791 (__v8sf)
8793 (__mmask8) __U);
8794}
8795
8796extern __inline __m128
8799{
8801 (__v4sf) __B,
8802 (__v4sf) __W,
8803 (__mmask8) __U);
8804}
8805
8806extern __inline __m128
8809{
8811 (__v4sf) __B,
8812 (__v4sf)
8813 _mm_setzero_ps (),
8814 (__mmask8) __U);
8815}
8816
8817extern __inline __m256i
8820 __m128i __B)
8821{
8823 (__v4si) __B,
8824 (__v8si) __W,
8825 (__mmask8) __U);
8826}
8827
8828extern __inline __m256i
8831{
8833 (__v4si) __B,
8834 (__v8si)
8836 (__mmask8) __U);
8837}
8838
8839extern __inline __m128i
8842 __m128i __B)
8843{
8845 (__v4si) __B,
8846 (__v4si) __W,
8847 (__mmask8) __U);
8848}
8849
8850extern __inline __m128i
8853{
8855 (__v4si) __B,
8856 (__v4si)
8858 (__mmask8) __U);
8859}
8860
8861extern __inline __m256i
8864{
8866 (__v2di) __B,
8867 (__v4di)
8869 (__mmask8) -1);
8870}
8871
8872extern __inline __m256i
8875 __m128i __B)
8876{
8878 (__v2di) __B,
8879 (__v4di) __W,
8880 (__mmask8) __U);
8881}
8882
8883extern __inline __m256i
8886{
8888 (__v2di) __B,
8889 (__v4di)
8891 (__mmask8) __U);
8892}
8893
8894extern __inline __m128i
8897{
8899 (__v2di) __B,
8900 (__v2di)
8902 (__mmask8) -1);
8903}
8904
8905extern __inline __m128i
8908 __m128i __B)
8909{
8911 (__v2di) __B,
8912 (__v2di) __W,
8913 (__mmask8) __U);
8914}
8915
8916extern __inline __m128i
8919{
8921 (__v2di) __B,
8922 (__v2di)
8924 (__mmask8) __U);
8925}
8926
8927extern __inline __m128i
8930 __m128i __B)
8931{
8933 (__v4si) __B,
8934 (__v4si) __W,
8935 (__mmask8) __U);
8936}
8937
8938extern __inline __m128i
8941{
8943 (__v4si) __B,
8944 (__v4si)
8946 (__mmask8) __U);
8947}
8948
8949extern __inline __m128i
8952 __m128i __B)
8953{
8955 (__v2di) __B,
8956 (__v2di) __W,
8957 (__mmask8) __U);
8958}
8959
8960extern __inline __m128i
8963{
8965 (__v2di) __B,
8966 (__v2di)
8968 (__mmask8) __U);
8969}
8970
8971extern __inline __m256i
8974 __m128i __B)
8975{
8977 (__v4si) __B,
8978 (__v8si) __W,
8979 (__mmask8) __U);
8980}
8981
8982extern __inline __m256i
8985{
8987 (__v4si) __B,
8988 (__v8si)
8990 (__mmask8) __U);
8991}
8992
8993extern __inline __m256i
8996 __m128i __B)
8997{
8999 (__v2di) __B,
9000 (__v4di) __W,
9001 (__mmask8) __U);
9002}
9003
9004extern __inline __m256i
9007{
9009 (__v2di) __B,
9010 (__v4di)
9012 (__mmask8) __U);
9013}
9014
9015extern __inline __m256
9018 __m256 __Y)
9019{
9021 (__v8si) __X,
9022 (__v8sf) __W,
9023 (__mmask8) __U);
9024}
9025
9026extern __inline __m256
9029{
9031 (__v8si) __X,
9032 (__v8sf)
9034 (__mmask8) __U);
9035}
9036
9037extern __inline __m256d
9040{
9042 (__v4di) __X,
9043 (__v4df)
9045 (__mmask8) -1);
9046}
9047
9048extern __inline __m256d
9051 __m256d __Y)
9052{
9054 (__v4di) __X,
9055 (__v4df) __W,
9056 (__mmask8) __U);
9057}
9058
9059extern __inline __m256d
9062{
9064 (__v4di) __X,
9065 (__v4df)
9067 (__mmask8) __U);
9068}
9069
9070extern __inline __m256d
9073 __m256i __C)
9074{
9076 (__v4di) __C,
9077 (__v4df) __W,
9078 (__mmask8)
9079 __U);
9080}
9081
9082extern __inline __m256d
9085{
9087 (__v4di) __C,
9088 (__v4df)
9090 (__mmask8)
9091 __U);
9092}
9093
9094extern __inline __m256
9097 __m256i __C)
9098{
9100 (__v8si) __C,
9101 (__v8sf) __W,
9102 (__mmask8) __U);
9103}
9104
9105extern __inline __m256
9108{
9110 (__v8si) __C,
9111 (__v8sf)
9113 (__mmask8) __U);
9114}
9115
9116extern __inline __m128d
9119 __m128i __C)
9120{
9122 (__v2di) __C,
9123 (__v2df) __W,
9124 (__mmask8) __U);
9125}
9126
9127extern __inline __m128d
9130{
9132 (__v2di) __C,
9133 (__v2df)
9134 _mm_setzero_pd (),
9135 (__mmask8) __U);
9136}
9137
9138extern __inline __m128
9141 __m128i __C)
9142{
9144 (__v4si) __C,
9145 (__v4sf) __W,
9146 (__mmask8) __U);
9147}
9148
9149extern __inline __m128
9152{
9154 (__v4si) __C,
9155 (__v4sf)
9156 _mm_setzero_ps (),
9157 (__mmask8) __U);
9158}
9159
9160extern __inline __m256i
9163{
9165 (__v8si) __B,
9166 (__v8si)
9168 __M);
9169}
9170
9171extern __inline __m256i
9174{
9176 (__v4di) __X,
9177 (__v4di)
9179 __M);
9180}
9181
9182extern __inline __m256i
9185 __m256i __B)
9186{
9188 (__v8si) __B,
9189 (__v8si) __W, __M);
9190}
9191
9192extern __inline __m128i
9195{
9197 (__v4si) __B,
9198 (__v4si)
9200 __M);
9201}
9202
9203extern __inline __m128i
9206 __m128i __B)
9207{
9209 (__v4si) __B,
9210 (__v4si) __W, __M);
9211}
9212
9213extern __inline __m256i
9216 __m256i __Y)
9217{
9219 (__v8si) __Y,
9220 (__v4di) __W, __M);
9221}
9222
9223extern __inline __m256i
9226{
9228 (__v8si) __Y,
9229 (__v4di)
9231 __M);
9232}
9233
9234extern __inline __m128i
9237 __m128i __Y)
9238{
9240 (__v4si) __Y,
9241 (__v2di) __W, __M);
9242}
9243
9244extern __inline __m128i
9247{
9249 (__v4si) __Y,
9250 (__v2di)
9252 __M);
9253}
9254
9255extern __inline __m256i
9258{
9260 (__v4di) __X,
9261 (__v4di)
9263 (__mmask8) -1);
9264}
9265
9266extern __inline __m256i
9269 __m256i __Y)
9270{
9272 (__v4di) __X,
9273 (__v4di) __W,
9274 __M);
9275}
9276
9277extern __inline __m256i
9280 __m256i __Y)
9281{
9283 (__v8si) __Y,
9284 (__v4di) __W, __M);
9285}
9286
9287extern __inline __m256i
9290{
9292 (__v8si) __X,
9293 (__v8si)
9295 __M);
9296}
9297
9298extern __inline __m256i
9301{
9303 (__v8si) __Y,
9304 (__v4di)
9306 __M);
9307}
9308
9309extern __inline __m128i
9312 __m128i __Y)
9313{
9315 (__v4si) __Y,
9316 (__v2di) __W, __M);
9317}
9318
9319extern __inline __m128i
9322{
9324 (__v4si) __Y,
9325 (__v2di)
9327 __M);
9328}
9329
9330extern __inline __m256i
9333{
9335 (__v8si) __X,
9336 (__v8si)
9338 (__mmask8) -1);
9339}
9340
9341extern __inline __m256i
9344 __m256i __Y)
9345{
9347 (__v8si) __X,
9348 (__v8si) __W,
9349 __M);
9350}
9351
9352extern __inline __mmask8
9355{
9357 (__v8si) __Y, 4,
9358 (__mmask8) __M);
9359}
9360
9361extern __inline __mmask8
9364{
9366 (__v8si) __Y, 4,
9367 (__mmask8) -1);
9368}
9369
9370extern __inline __mmask8
9373{
9375 (__v8si) __Y, 1,
9376 (__mmask8) __M);
9377}
9378
9379extern __inline __mmask8
9382{
9384 (__v8si) __Y, 1,
9385 (__mmask8) -1);
9386}
9387
9388extern __inline __mmask8
9391{
9393 (__v8si) __Y, 5,
9394 (__mmask8) __M);
9395}
9396
9397extern __inline __mmask8
9400{
9402 (__v8si) __Y, 5,
9403 (__mmask8) -1);
9404}
9405
9406extern __inline __mmask8
9409{
9411 (__v8si) __Y, 2,
9412 (__mmask8) __M);
9413}
9414
9415extern __inline __mmask8
9418{
9420 (__v8si) __Y, 2,
9421 (__mmask8) -1);
9422}
9423
9424extern __inline __mmask8
9427{
9429 (__v4di) __Y, 4,
9430 (__mmask8) __M);
9431}
9432
9433extern __inline __mmask8
9436{
9438 (__v4di) __Y, 4,
9439 (__mmask8) -1);
9440}
9441
9442extern __inline __mmask8
9445{
9447 (__v4di) __Y, 1,
9448 (__mmask8) __M);
9449}
9450
9451extern __inline __mmask8
9454{
9456 (__v4di) __Y, 1,
9457 (__mmask8) -1);
9458}
9459
9460extern __inline __mmask8
9463{
9465 (__v4di) __Y, 5,
9466 (__mmask8) __M);
9467}
9468
9469extern __inline __mmask8
9472{
9474 (__v4di) __Y, 5,
9475 (__mmask8) -1);
9476}
9477
9478extern __inline __mmask8
9481{
9483 (__v4di) __Y, 2,
9484 (__mmask8) __M);
9485}
9486
9487extern __inline __mmask8
9490{
9492 (__v4di) __Y, 2,
9493 (__mmask8) -1);
9494}
9495
9496extern __inline __mmask8
9499{
9501 (__v8si) __Y, 4,
9502 (__mmask8) __M);
9503}
9504
9505extern __inline __mmask8
9508{
9510 (__v8si) __Y, 4,
9511 (__mmask8) -1);
9512}
9513
9514extern __inline __mmask8
9517{
9519 (__v8si) __Y, 1,
9520 (__mmask8) __M);
9521}
9522
9523extern __inline __mmask8
9526{
9528 (__v8si) __Y, 1,
9529 (__mmask8) -1);
9530}
9531
9532extern __inline __mmask8
9535{
9537 (__v8si) __Y, 5,
9538 (__mmask8) __M);
9539}
9540
9541extern __inline __mmask8
9544{
9546 (__v8si) __Y, 5,
9547 (__mmask8) -1);
9548}
9549
9550extern __inline __mmask8
9553{
9555 (__v8si) __Y, 2,
9556 (__mmask8) __M);
9557}
9558
9559extern __inline __mmask8
9562{
9564 (__v8si) __Y, 2,
9565 (__mmask8) -1);
9566}
9567
9568extern __inline __mmask8
9571{
9573 (__v4di) __Y, 4,
9574 (__mmask8) __M);
9575}
9576
9577extern __inline __mmask8
9580{
9582 (__v4di) __Y, 4,
9583 (__mmask8) -1);
9584}
9585
9586extern __inline __mmask8
9589{
9591 (__v4di) __Y, 1,
9592 (__mmask8) __M);
9593}
9594
9595extern __inline __mmask8
9598{
9600 (__v4di) __Y, 1,
9601 (__mmask8) -1);
9602}
9603
9604extern __inline __mmask8
9607{
9609 (__v4di) __Y, 5,
9610 (__mmask8) __M);
9611}
9612
9613extern __inline __mmask8
9616{
9618 (__v4di) __Y, 5,
9619 (__mmask8) -1);
9620}
9621
9622extern __inline __mmask8
9625{
9627 (__v4di) __Y, 2,
9628 (__mmask8) __M);
9629}
9630
9631extern __inline __mmask8
9634{
9636 (__v4di) __Y, 2,
9637 (__mmask8) -1);
9638}
9639
9640extern __inline __mmask8
9643{
9645 (__v4si) __Y, 4,
9646 (__mmask8) __M);
9647}
9648
9649extern __inline __mmask8
9652{
9654 (__v4si) __Y, 4,
9655 (__mmask8) -1);
9656}
9657
9658extern __inline __mmask8
9661{
9663 (__v4si) __Y, 1,
9664 (__mmask8) __M);
9665}
9666
9667extern __inline __mmask8
9670{
9672 (__v4si) __Y, 1,
9673 (__mmask8) -1);
9674}
9675
9676extern __inline __mmask8
9679{
9681 (__v4si) __Y, 5,
9682 (__mmask8) __M);
9683}
9684
9685extern __inline __mmask8
9688{
9690 (__v4si) __Y, 5,
9691 (__mmask8) -1);
9692}
9693
9694extern __inline __mmask8
9697{
9699 (__v4si) __Y, 2,
9700 (__mmask8) __M);
9701}
9702
9703extern __inline __mmask8
9706{
9708 (__v4si) __Y, 2,
9709 (__mmask8) -1);
9710}
9711
9712extern __inline __mmask8
9715{
9717 (__v2di) __Y, 4,
9718 (__mmask8) __M);
9719}
9720
9721extern __inline __mmask8
9724{
9726 (__v2di) __Y, 4,
9727 (__mmask8) -1);
9728}
9729
9730extern __inline __mmask8
9733{
9735 (__v2di) __Y, 1,
9736 (__mmask8) __M);
9737}
9738
9739extern __inline __mmask8
9742{
9744 (__v2di) __Y, 1,
9745 (__mmask8) -1);
9746}
9747
9748extern __inline __mmask8
9751{
9753 (__v2di) __Y, 5,
9754 (__mmask8) __M);
9755}
9756
9757extern __inline __mmask8
9760{
9762 (__v2di) __Y, 5,
9763 (__mmask8) -1);
9764}
9765
9766extern __inline __mmask8
9769{
9771 (__v2di) __Y, 2,
9772 (__mmask8) __M);
9773}
9774
9775extern __inline __mmask8
9778{
9780 (__v2di) __Y, 2,
9781 (__mmask8) -1);
9782}
9783
9784extern __inline __mmask8
9787{
9789 (__v4si) __Y, 4,
9790 (__mmask8) __M);
9791}
9792
9793extern __inline __mmask8
9796{
9798 (__v4si) __Y, 4,
9799 (__mmask8) -1);
9800}
9801
9802extern __inline __mmask8
9805{
9807 (__v4si) __Y, 1,
9808 (__mmask8) __M);
9809}
9810
9811extern __inline __mmask8
9814{
9816 (__v4si) __Y, 1,
9817 (__mmask8) -1);
9818}
9819
9820extern __inline __mmask8
9823{
9825 (__v4si) __Y, 5,
9826 (__mmask8) __M);
9827}
9828
9829extern __inline __mmask8
9832{
9834 (__v4si) __Y, 5,
9835 (__mmask8) -1);
9836}
9837
9838extern __inline __mmask8
9841{
9843 (__v4si) __Y, 2,
9844 (__mmask8) __M);
9845}
9846
9847extern __inline __mmask8
9850{
9852 (__v4si) __Y, 2,
9853 (__mmask8) -1);
9854}
9855
9856extern __inline __mmask8
9859{
9861 (__v2di) __Y, 4,
9862 (__mmask8) __M);
9863}
9864
9865extern __inline __mmask8
9868{
9870 (__v2di) __Y, 4,
9871 (__mmask8) -1);
9872}
9873
9874extern __inline __mmask8
9877{
9879 (__v2di) __Y, 1,
9880 (__mmask8) __M);
9881}
9882
9883extern __inline __mmask8
9886{
9888 (__v2di) __Y, 1,
9889 (__mmask8) -1);
9890}
9891
9892extern __inline __mmask8
9895{
9897 (__v2di) __Y, 5,
9898 (__mmask8) __M);
9899}
9900
9901extern __inline __mmask8
9904{
9906 (__v2di) __Y, 5,
9907 (__mmask8) -1);
9908}
9909
9910extern __inline __mmask8
9913{
9915 (__v2di) __Y, 2,
9916 (__mmask8) __M);
9917}
9918
9919extern __inline __mmask8
9922{
9924 (__v2di) __Y, 2,
9925 (__mmask8) -1);
9926}
9927
9928#ifdef __OPTIMIZE__
9929extern __inline __m256i
9932{
9934 __I,
9935 (__v4di)
9937 (__mmask8) -1);
9938}
9939
9940extern __inline __m256i
9943 __m256i __X, const int __I)
9944{
9946 __I,
9947 (__v4di) __W,
9948 (__mmask8) __M);
9949}
9950
9951extern __inline __m256i
9954{
9956 __I,
9957 (__v4di)
9959 (__mmask8) __M);
9960}
9961
9962extern __inline __m256d
9965 __m256d __B, const int __imm)
9966{
9968 (__v4df) __B, __imm,
9969 (__v4df) __W,
9970 (__mmask8) __U);
9971}
9972
9973extern __inline __m256d
9976 const int __imm)
9977{
9979 (__v4df) __B, __imm,
9980 (__v4df)
9982 (__mmask8) __U);
9983}
9984
9985extern __inline __m128d
9988 __m128d __B, const int __imm)
9989{
9991 (__v2df) __B, __imm,
9992 (__v2df) __W,
9993 (__mmask8) __U);
9994}
9995
9996extern __inline __m128d
9999 const int __imm)
10000{
10002 (__v2df) __B, __imm,
10003 (__v2df)
10004 _mm_setzero_pd (),
10005 (__mmask8) __U);
10006}
10007
10008extern __inline __m256
10011 __m256 __B, const int __imm)
10012{
10014 (__v8sf) __B, __imm,
10015 (__v8sf) __W,
10016 (__mmask8) __U);
10017}
10018
10019extern __inline __m256
10022 const int __imm)
10023{
10025 (__v8sf) __B, __imm,
10026 (__v8sf)
10028 (__mmask8) __U);
10029}
10030
10031extern __inline __m128
10034 const int __imm)
10035{
10037 (__v4sf) __B, __imm,
10038 (__v4sf) __W,
10039 (__mmask8) __U);
10040}
10041
10042extern __inline __m128
10045 const int __imm)
10046{
10048 (__v4sf) __B, __imm,
10049 (__v4sf)
10050 _mm_setzero_ps (),
10051 (__mmask8) __U);
10052}
10053
10054extern __inline __m256i
10057{
10059 (__v4si) __B,
10060 __imm,
10061 (__v8si)
10063 (__mmask8) -1);
10064}
10065
10066extern __inline __m256i
10069 __m128i __B, const int __imm)
10070{
10072 (__v4si) __B,
10073 __imm,
10074 (__v8si) __W,
10075 (__mmask8)
10076 __U);
10077}
10078
10079extern __inline __m256i
10082 const int __imm)
10083{
10085 (__v4si) __B,
10086 __imm,
10087 (__v8si)
10089 (__mmask8)
10090 __U);
10091}
10092
10093extern __inline __m256
10096{
10098 (__v4sf) __B,
10099 __imm,
10100 (__v8sf)
10102 (__mmask8) -1);
10103}
10104
10105extern __inline __m256
10108 __m128 __B, const int __imm)
10109{
10111 (__v4sf) __B,
10112 __imm,
10113 (__v8sf) __W,
10114 (__mmask8) __U);
10115}
10116
10117extern __inline __m256
10120 const int __imm)
10121{
10123 (__v4sf) __B,
10124 __imm,
10125 (__v8sf)
10127 (__mmask8) __U);
10128}
10129
10130extern __inline __m128i
10133{
10135 __imm,
10136 (__v4si)
10138 (__mmask8) -1);
10139}
10140
10141extern __inline __m128i
10144 const int __imm)
10145{
10147 __imm,
10148 (__v4si) __W,
10149 (__mmask8)
10150 __U);
10151}
10152
10153extern __inline __m128i
10156 const int __imm)
10157{
10159 __imm,
10160 (__v4si)
10162 (__mmask8)
10163 __U);
10164}
10165
10166extern __inline __m128
10169{
10171 __imm,
10172 (__v4sf)
10173 _mm_setzero_ps (),
10174 (__mmask8) -1);
10175}
10176
10177extern __inline __m128
10180 const int __imm)
10181{
10183 __imm,
10184 (__v4sf) __W,
10185 (__mmask8)
10186 __U);
10187}
10188
10189extern __inline __m128
10192 const int __imm)
10193{
10195 __imm,
10196 (__v4sf)
10197 _mm_setzero_ps (),
10198 (__mmask8)
10199 __U);
10200}
10201
10202extern __inline __m256i
10205{
10207 (__v4di) __B,
10208 __imm,
10209 (__v4di)
10211 (__mmask8) -1);
10212}
10213
10214extern __inline __m256i
10217 __m256i __B, const int __imm)
10218{
10220 (__v4di) __B,
10221 __imm,
10222 (__v4di) __W,
10223 (__mmask8) __U);
10224}
10225
10226extern __inline __m256i
10229 const int __imm)
10230{
10232 (__v4di) __B,
10233 __imm,
10234 (__v4di)
10236 (__mmask8) __U);
10237}
10238
10239extern __inline __m256i
10242{
10244 (__v8si) __B,
10245 __imm,
10246 (__v8si)
10248 (__mmask8) -1);
10249}
10250
10251extern __inline __m256i
10254 __m256i __B, const int __imm)
10255{
10257 (__v8si) __B,
10258 __imm,
10259 (__v8si) __W,
10260 (__mmask8) __U);
10261}
10262
10263extern __inline __m256i
10266 const int __imm)
10267{
10269 (__v8si) __B,
10270 __imm,
10271 (__v8si)
10273 (__mmask8) __U);
10274}
10275
10276extern __inline __m256d
10279{
10281 (__v4df) __B,
10282 __imm,
10283 (__v4df)
10285 (__mmask8) -1);
10286}
10287
10288extern __inline __m256d
10291 __m256d __B, const int __imm)
10292{
10294 (__v4df) __B,
10295 __imm,
10296 (__v4df) __W,
10297 (__mmask8) __U);
10298}
10299
10300extern __inline __m256d
10303 const int __imm)
10304{
10306 (__v4df) __B,
10307 __imm,
10308 (__v4df)
10310 (__mmask8) __U);
10311}
10312
10313extern __inline __m256
10316{
10318 (__v8sf) __B,
10319 __imm,
10320 (__v8sf)
10322 (__mmask8) -1);
10323}
10324
10325extern __inline __m256
10328 __m256 __B, const int __imm)
10329{
10331 (__v8sf) __B,
10332 __imm,
10333 (__v8sf) __W,
10334 (__mmask8) __U);
10335}
10336
10337extern __inline __m256
10340 const int __imm)
10341{
10343 (__v8sf) __B,
10344 __imm,
10345 (__v8sf)
10347 (__mmask8) __U);
10348}
10349
10350extern __inline __m256d
10353 const int __imm)
10354{
10356 (__v4df) __B,
10357 (__v4di) __C,
10358 __imm,
10359 (__mmask8) -1);
10360}
10361
10362extern __inline __m256d
10365 __m256i __C, const int __imm)
10366{
10368 (__v4df) __B,
10369 (__v4di) __C,
10370 __imm,
10371 (__mmask8) __U);
10372}
10373
10374extern __inline __m256d
10377 __m256i __C, const int __imm)
10378{
10380 (__v4df) __B,
10381 (__v4di) __C,
10382 __imm,
10383 (__mmask8) __U);
10384}
10385
10386extern __inline __m256
10389 const int __imm)
10390{
10392 (__v8sf) __B,
10393 (__v8si) __C,
10394 __imm,
10395 (__mmask8) -1);
10396}
10397
10398extern __inline __m256
10401 __m256i __C, const int __imm)
10402{
10404 (__v8sf) __B,
10405 (__v8si) __C,
10406 __imm,
10407 (__mmask8) __U);
10408}
10409
10410extern __inline __m256
10413 __m256i __C, const int __imm)
10414{
10416 (__v8sf) __B,
10417 (__v8si) __C,
10418 __imm,
10419 (__mmask8) __U);
10420}
10421
10422extern __inline __m128d
10425 const int __imm)
10426{
10428 (__v2df) __B,
10429 (__v2di) __C,
10430 __imm,
10431 (__mmask8) -1);
10432}
10433
10434extern __inline __m128d
10437 __m128i __C, const int __imm)
10438{
10440 (__v2df) __B,
10441 (__v2di) __C,
10442 __imm,
10443 (__mmask8) __U);
10444}
10445
10446extern __inline __m128d
10449 __m128i __C, const int __imm)
10450{
10452 (__v2df) __B,
10453 (__v2di) __C,
10454 __imm,
10455 (__mmask8) __U);
10456}
10457
10458extern __inline __m128
10461{
10463 (__v4sf) __B,
10464 (__v4si) __C,
10465 __imm,
10466 (__mmask8) -1);
10467}
10468
10469extern __inline __m128
10472 __m128i __C, const int __imm)
10473{
10475 (__v4sf) __B,
10476 (__v4si) __C,
10477 __imm,
10478 (__mmask8) __U);
10479}
10480
10481extern __inline __m128
10484 __m128i __C, const int __imm)
10485{
10487 (__v4sf) __B,
10488 (__v4si) __C,
10489 __imm,
10490 (__mmask8) __U);
10491}
10492
10493extern __inline __m256i
10496 const int __imm)
10497{
10499 (__v8si) __W,
10500 (__mmask8) __U);
10501}
10502
10503extern __inline __m256i
10506{
10508 (__v8si)
10510 (__mmask8) __U);
10511}
10512
10513extern __inline __m128i
10516 const int __imm)
10517{
10519 (__v4si) __W,
10520 (__mmask8) __U);
10521}
10522
10523extern __inline __m128i
10526{
10528 (__v4si)
10530 (__mmask8) __U);
10531}
10532
10533extern __inline __m256i
10536 const int __imm)
10537{
10539 (__v4di) __W,
10540 (__mmask8) __U);
10541}
10542
10543extern __inline __m256i
10546{
10548 (__v4di)
10550 (__mmask8) __U);
10551}
10552
10553extern __inline __m128i
10556 const int __imm)
10557{
10559 (__v2di) __W,
10560 (__mmask8) __U);
10561}
10562
10563extern __inline __m128i
10566{
10568 (__v2di)
10570 (__mmask8) __U);
10571}
10572
10573extern __inline __m256i
10576 const int __imm)
10577{
10578 return (__m256i)
10580 (__v4di) __B,
10581 (__v4di) __C,
10582 (unsigned char) __imm,
10583 (__mmask8) -1);
10584}
10585
10586extern __inline __m256i
10590 const int __imm)
10591{
10592 return (__m256i)
10594 (__v4di) __B,
10595 (__v4di) __C,
10596 (unsigned char) __imm,
10597 (__mmask8) __U);
10598}
10599
10600extern __inline __m256i
10604 const int __imm)
10605{
10606 return (__m256i)
10608 (__v4di) __B,
10609 (__v4di) __C,
10610 (unsigned char) __imm,
10611 (__mmask8) __U);
10612}
10613
10614extern __inline __m256i
10617 const int __imm)
10618{
10619 return (__m256i)
10621 (__v8si) __B,
10622 (__v8si) __C,
10623 (unsigned char) __imm,
10624 (__mmask8) -1);
10625}
10626
10627extern __inline __m256i
10631 const int __imm)
10632{
10633 return (__m256i)
10635 (__v8si) __B,
10636 (__v8si) __C,
10637 (unsigned char) __imm,
10638 (__mmask8) __U);
10639}
10640
10641extern __inline __m256i
10645 const int __imm)
10646{
10647 return (__m256i)
10649 (__v8si) __B,
10650 (__v8si) __C,
10651 (unsigned char) __imm,
10652 (__mmask8) __U);
10653}
10654
10655extern __inline __m128i
10658 const int __imm)
10659{
10660 return (__m128i)
10662 (__v2di) __B,
10663 (__v2di) __C,
10664 (unsigned char) __imm,
10665 (__mmask8) -1);
10666}
10667
10668extern __inline __m128i
10672 const int __imm)
10673{
10674 return (__m128i)
10676 (__v2di) __B,
10677 (__v2di) __C,
10678 (unsigned char) __imm,
10679 (__mmask8) __U);
10680}
10681
10682extern __inline __m128i
10686 const int __imm)
10687{
10688 return (__m128i)
10690 (__v2di) __B,
10691 (__v2di) __C,
10692 (unsigned char) __imm,
10693 (__mmask8) __U);
10694}
10695
10696extern __inline __m128i
10699 const int __imm)
10700{
10701 return (__m128i)
10703 (__v4si) __B,
10704 (__v4si) __C,
10705 (unsigned char) __imm,
10706 (__mmask8) -1);
10707}
10708
10709extern __inline __m128i
10713 const int __imm)
10714{
10715 return (__m128i)
10717 (__v4si) __B,
10718 (__v4si) __C,
10719 (unsigned char) __imm,
10720 (__mmask8) __U);
10721}
10722
10723extern __inline __m128i
10727 const int __imm)
10728{
10729 return (__m128i)
10731 (__v4si) __B,
10732 (__v4si) __C,
10733 (unsigned char) __imm,
10734 (__mmask8) __U);
10735}
10736
10737extern __inline __m256
10740{
10742 __imm,
10743 (__v8sf)
10745 (__mmask8) -1);
10746}
10747
10748extern __inline __m256
10751 const int __imm)
10752{
10754 __imm,
10755 (__v8sf) __W,
10756 (__mmask8) __U);
10757}
10758
10759extern __inline __m256
10762{
10764 __imm,
10765 (__v8sf)
10767 (__mmask8) __U);
10768}
10769
10770extern __inline __m256d
10773{
10775 __imm,
10776 (__v4df)
10778 (__mmask8) -1);
10779}
10780
10781extern __inline __m256d
10784 const int __imm)
10785{
10787 __imm,
10788 (__v4df) __W,
10789 (__mmask8) __U);
10790}
10791
10792extern __inline __m256d
10795{
10797 __imm,
10798 (__v4df)
10800 (__mmask8) __U);
10801}
10802
10803extern __inline __m128
10805_mm_roundscale_ps (__m128 __A, const int __imm)
10806{
10808 __imm,
10809 (__v4sf)
10810 _mm_setzero_ps (),
10811 (__mmask8) -1);
10812}
10813
10814extern __inline __m128
10817 const int __imm)
10818{
10820 __imm,
10821 (__v4sf) __W,
10822 (__mmask8) __U);
10823}
10824
10825extern __inline __m128
10828{
10830 __imm,
10831 (__v4sf)
10832 _mm_setzero_ps (),
10833 (__mmask8) __U);
10834}
10835
10836extern __inline __m128d
10839{
10841 __imm,
10842 (__v2df)
10843 _mm_setzero_pd (),
10844 (__mmask8) -1);
10845}
10846
10847extern __inline __m128d
10850 const int __imm)
10851{
10853 __imm,
10854 (__v2df) __W,
10855 (__mmask8) __U);
10856}
10857
10858extern __inline __m128d
10861{
10863 __imm,
10864 (__v2df)
10865 _mm_setzero_pd (),
10866 (__mmask8) __U);
10867}
10868
10869extern __inline __m256
10873{
10875 (__C << 2) | __B,
10876 (__v8sf)
10878 (__mmask8) -1);
10879}
10880
10881extern __inline __m256
10886{
10888 (__C << 2) | __B,
10889 (__v8sf) __W,
10890 (__mmask8) __U);
10891}
10892
10893extern __inline __m256
10898{
10900 (__C << 2) | __B,
10901 (__v8sf)
10903 (__mmask8) __U);
10904}
10905
10906extern __inline __m128
10910{
10912 (__C << 2) | __B,
10913 (__v4sf)
10914 _mm_setzero_ps (),
10915 (__mmask8) -1);
10916}
10917
10918extern __inline __m128
10923{
10925 (__C << 2) | __B,
10926 (__v4sf) __W,
10927 (__mmask8) __U);
10928}
10929
10930extern __inline __m128
10935{
10937 (__C << 2) | __B,
10938 (__v4sf)
10939 _mm_setzero_ps (),
10940 (__mmask8) __U);
10941}
10942
10943extern __inline __m256d
10947{
10949 (__C << 2) | __B,
10950 (__v4df)
10952 (__mmask8) -1);
10953}
10954
10955extern __inline __m256d
10960{
10962 (__C << 2) | __B,
10963 (__v4df) __W,
10964 (__mmask8) __U);
10965}
10966
10967extern __inline __m256d
10972{
10974 (__C << 2) | __B,
10975 (__v4df)
10977 (__mmask8) __U);
10978}
10979
10980extern __inline __m128d
10984{
10986 (__C << 2) | __B,
10987 (__v2df)
10988 _mm_setzero_pd (),
10989 (__mmask8) -1);
10990}
10991
10992extern __inline __m128d
10997{
10999 (__C << 2) | __B,
11000 (__v2df) __W,
11001 (__mmask8) __U);
11002}
11003
11004extern __inline __m128d
11009{
11011 (__C << 2) | __B,
11012 (__v2df)
11013 _mm_setzero_pd (),
11014 (__mmask8) __U);
11015}
11016
11017extern __inline __m256
11020 __m256i __index, void const *__addr,
11021 int __scale)
11022{
11024 __addr,
11025 (__v8si) __index,
11026 __mask, __scale);
11027}
11028
11029extern __inline __m128
11032 __m128i __index, void const *__addr,
11033 int __scale)
11034{
11036 __addr,
11037 (__v4si) __index,
11038 __mask, __scale);
11039}
11040
11041extern __inline __m256d
11044 __m128i __index, void const *__addr,
11045 int __scale)
11046{
11048 __addr,
11049 (__v4si) __index,
11050 __mask, __scale);
11051}
11052
11053extern __inline __m128d
11056 __m128i __index, void const *__addr,
11057 int __scale)
11058{
11060 __addr,
11061 (__v4si) __index,
11062 __mask, __scale);
11063}
11064
11065extern __inline __m128
11068 __m256i __index, void const *__addr,
11069 int __scale)
11070{
11072 __addr,
11073 (__v4di) __index,
11074 __mask, __scale);
11075}
11076
11077extern __inline __m128
11080 __m128i __index, void const *__addr,
11081 int __scale)
11082{
11084 __addr,
11085 (__v2di) __index,
11086 __mask, __scale);
11087}
11088
11089extern __inline __m256d
11092 __m256i __index, void const *__addr,
11093 int __scale)
11094{
11096 __addr,
11097 (__v4di) __index,
11098 __mask, __scale);
11099}
11100
11101extern __inline __m128d
11104 __m128i __index, void const *__addr,
11105 int __scale)
11106{
11108 __addr,
11109 (__v2di) __index,
11110 __mask, __scale);
11111}
11112
11113extern __inline __m256i
11116 __m256i __index, void const *__addr,
11117 int __scale)
11118{
11120 __addr,
11121 (__v8si) __index,
11122 __mask, __scale);
11123}
11124
11125extern __inline __m128i
11128 __m128i __index, void const *__addr,
11129 int __scale)
11130{
11132 __addr,
11133 (__v4si) __index,
11134 __mask, __scale);
11135}
11136
11137extern __inline __m256i
11140 __m128i __index, void const *__addr,
11141 int __scale)
11142{
11144 __addr,
11145 (__v4si) __index,
11146 __mask, __scale);
11147}
11148
11149extern __inline __m128i
11152 __m128i __index, void const *__addr,
11153 int __scale)
11154{
11156 __addr,
11157 (__v4si) __index,
11158 __mask, __scale);
11159}
11160
11161extern __inline __m128i
11164 __m256i __index, void const *__addr,
11165 int __scale)
11166{
11168 __addr,
11169 (__v4di) __index,
11170 __mask, __scale);
11171}
11172
11173extern __inline __m128i
11176 __m128i __index, void const *__addr,
11177 int __scale)
11178{
11180 __addr,
11181 (__v2di) __index,
11182 __mask, __scale);
11183}
11184
11185extern __inline __m256i
11188 __m256i __index, void const *__addr,
11189 int __scale)
11190{
11192 __addr,
11193 (__v4di) __index,
11194 __mask, __scale);
11195}
11196
11197extern __inline __m128i
11200 __m128i __index, void const *__addr,
11201 int __scale)
11202{
11204 __addr,
11205 (__v2di) __index,
11206 __mask, __scale);
11207}
11208
11209extern __inline void
11212 __m256 __v1, const int __scale)
11213{
11216 __scale);
11217}
11218
11219extern __inline void
11223 const int __scale)
11224{
11226 (__v8sf) __v1, __scale);
11227}
11228
11229extern __inline void
11232 const int __scale)
11233{
11236 __scale);
11237}
11238
11239extern __inline void
11243 const int __scale)
11244{
11246 (__v4sf) __v1, __scale);
11247}
11248
11249extern __inline void
11252 __m256d __v1, const int __scale)
11253{
11256 __scale);
11257}
11258
11259extern __inline void
11263 const int __scale)
11264{
11266 (__v4df) __v1, __scale);
11267}
11268
11269extern __inline void
11272 __m128d __v1, const int __scale)
11273{
11276 __scale);
11277}
11278
11279extern __inline void
11283 const int __scale)
11284{
11286 (__v2df) __v1, __scale);
11287}
11288
11289extern __inline void
11292 __m128 __v1, const int __scale)
11293{
11296 __scale);
11297}
11298
11299extern __inline void
11303 const int __scale)
11304{
11306 (__v4sf) __v1, __scale);
11307}
11308
11309extern __inline void
11312 const int __scale)
11313{
11316 __scale);
11317}
11318
11319extern __inline void
11323 const int __scale)
11324{
11326 (__v4sf) __v1, __scale);
11327}
11328
11329extern __inline void
11332 __m256d __v1, const int __scale)
11333{
11336 __scale);
11337}
11338
11339extern __inline void
11343 const int __scale)
11344{
11346 (__v4df) __v1, __scale);
11347}
11348
11349extern __inline void
11352 __m128d __v1, const int __scale)
11353{
11356 __scale);
11357}
11358
11359extern __inline void
11363 const int __scale)
11364{
11366 (__v2df) __v1, __scale);
11367}
11368
11369extern __inline void
11372 __m256i __v1, const int __scale)
11373{
11376 __scale);
11377}
11378
11379extern __inline void
11383 const int __scale)
11384{
11386 (__v8si) __v1, __scale);
11387}
11388
11389extern __inline void
11392 __m128i __v1, const int __scale)
11393{
11396 __scale);
11397}
11398
11399extern __inline void
11403 const int __scale)
11404{
11406 (__v4si) __v1, __scale);
11407}
11408
11409extern __inline void
11412 __m256i __v1, const int __scale)
11413{
11416 __scale);
11417}
11418
11419extern __inline void
11423 const int __scale)
11424{
11426 (__v4di) __v1, __scale);
11427}
11428
11429extern __inline void
11432 __m128i __v1, const int __scale)
11433{
11436 __scale);
11437}
11438
11439extern __inline void
11443 const int __scale)
11444{
11446 (__v2di) __v1, __scale);
11447}
11448
11449extern __inline void
11452 __m128i __v1, const int __scale)
11453{
11456 __scale);
11457}
11458
11459extern __inline void
11463 const int __scale)
11464{
11466 (__v4si) __v1, __scale);
11467}
11468
11469extern __inline void
11472 __m128i __v1, const int __scale)
11473{
11476 __scale);
11477}
11478
11479extern __inline void
11483 const int __scale)
11484{
11486 (__v4si) __v1, __scale);
11487}
11488
11489extern __inline void
11492 __m256i __v1, const int __scale)
11493{
11496 __scale);
11497}
11498
11499extern __inline void
11503 const int __scale)
11504{
11506 (__v4di) __v1, __scale);
11507}
11508
11509extern __inline void
11512 __m128i __v1, const int __scale)
11513{
11516 __scale);
11517}
11518
11519extern __inline void
11523 const int __scale)
11524{
11526 (__v2di) __v1, __scale);
11527}
11528
11529extern __inline __m256i
11533{
11535 (__v8si) __W,
11536 (__mmask8) __U);
11537}
11538
11539extern __inline __m256i
11543{
11545 (__v8si)
11547 (__mmask8) __U);
11548}
11549
11550extern __inline __m128i
11554{
11556 (__v4si) __W,
11557 (__mmask8) __U);
11558}
11559
11560extern __inline __m128i
11564{
11566 (__v4si)
11568 (__mmask8) __U);
11569}
11570
11571extern __inline __m256i
11573_mm256_rol_epi32 (__m256i __A, const int __B)
11574{
11576 (__v8si)
11578 (__mmask8) -1);
11579}
11580
11581extern __inline __m256i
11584 const int __B)
11585{
11587 (__v8si) __W,
11588 (__mmask8) __U);
11589}
11590
11591extern __inline __m256i
11594{
11596 (__v8si)
11598 (__mmask8) __U);
11599}
11600
11601extern __inline __m128i
11603_mm_rol_epi32 (__m128i __A, const int __B)
11604{
11606 (__v4si)
11608 (__mmask8) -1);
11609}
11610
11611extern __inline __m128i
11614 const int __B)
11615{
11617 (__v4si) __W,
11618 (__mmask8) __U);
11619}
11620
11621extern __inline __m128i
11624{
11626 (__v4si)
11628 (__mmask8) __U);
11629}
11630
11631extern __inline __m256i
11633_mm256_ror_epi32 (__m256i __A, const int __B)
11634{
11636 (__v8si)
11638 (__mmask8) -1);
11639}
11640
11641extern __inline __m256i
11644 const int __B)
11645{
11647 (__v8si) __W,
11648 (__mmask8) __U);
11649}
11650
11651extern __inline __m256i
11654{
11656 (__v8si)
11658 (__mmask8) __U);
11659}
11660
11661extern __inline __m128i
11663_mm_ror_epi32 (__m128i __A, const int __B)
11664{
11666 (__v4si)
11668 (__mmask8) -1);
11669}
11670
11671extern __inline __m128i
11674 const int __B)
11675{
11677 (__v4si) __W,
11678 (__mmask8) __U);
11679}
11680
11681extern __inline __m128i
11684{
11686 (__v4si)
11688 (__mmask8) __U);
11689}
11690
11691extern __inline __m256i
11693_mm256_rol_epi64 (__m256i __A, const int __B)
11694{
11696 (__v4di)
11698 (__mmask8) -1);
11699}
11700
11701extern __inline __m256i
11704 const int __B)
11705{
11707 (__v4di) __W,
11708 (__mmask8) __U);
11709}
11710
11711extern __inline __m256i
11714{
11716 (__v4di)
11718 (__mmask8) __U);
11719}
11720
11721extern __inline __m128i
11723_mm_rol_epi64 (__m128i __A, const int __B)
11724{
11726 (__v2di)
11728 (__mmask8) -1);
11729}
11730
11731extern __inline __m128i
11734 const int __B)
11735{
11737 (__v2di) __W,
11738 (__mmask8) __U);
11739}
11740
11741extern __inline __m128i
11744{
11746 (__v2di)
11748 (__mmask8) __U);
11749}
11750
11751extern __inline __m256i
11753_mm256_ror_epi64 (__m256i __A, const int __B)
11754{
11756 (__v4di)
11758 (__mmask8) -1);
11759}
11760
11761extern __inline __m256i
11764 const int __B)
11765{
11767 (__v4di) __W,
11768 (__mmask8) __U);
11769}
11770
11771extern __inline __m256i
11774{
11776 (__v4di)
11778 (__mmask8) __U);
11779}
11780
11781extern __inline __m128i
11783_mm_ror_epi64 (__m128i __A, const int __B)
11784{
11786 (__v2di)
11788 (__mmask8) -1);
11789}
11790
11791extern __inline __m128i
11794 const int __B)
11795{
11797 (__v2di) __W,
11798 (__mmask8) __U);
11799}
11800
11801extern __inline __m128i
11804{
11806 (__v2di)
11808 (__mmask8) __U);
11809}
11810
11811extern __inline __m128i
11814{
11816 (__v4si) __B, __imm,
11817 (__v4si)
11819 (__mmask8) -1);
11820}
11821
11822extern __inline __m128i
11825 __m128i __B, const int __imm)
11826{
11828 (__v4si) __B, __imm,
11829 (__v4si) __W,
11830 (__mmask8) __U);
11831}
11832
11833extern __inline __m128i
11836 const int __imm)
11837{
11839 (__v4si) __B, __imm,
11840 (__v4si)
11842 (__mmask8) __U);
11843}
11844
11845extern __inline __m128i
11848{
11850 (__v2di) __B, __imm,
11851 (__v2di)
11853 (__mmask8) -1);
11854}
11855
11856extern __inline __m128i
11859 __m128i __B, const int __imm)
11860{
11862 (__v2di) __B, __imm,
11863 (__v2di) __W,
11864 (__mmask8) __U);
11865}
11866
11867extern __inline __m128i
11870 const int __imm)
11871{
11873 (__v2di) __B, __imm,
11874 (__v2di)
11876 (__mmask8) __U);
11877}
11878
11879extern __inline __m256i
11882{
11884 (__v8si) __B, __imm,
11885 (__v8si)
11887 (__mmask8) -1);
11888}
11889
11890extern __inline __m256i
11893 __m256i __B, const int __imm)
11894{
11896 (__v8si) __B, __imm,
11897 (__v8si) __W,
11898 (__mmask8) __U);
11899}
11900
11901extern __inline __m256i
11904 const int __imm)
11905{
11907 (__v8si) __B, __imm,
11908 (__v8si)
11910 (__mmask8) __U);
11911}
11912
11913extern __inline __m256i
11916{
11918 (__v4di) __B, __imm,
11919 (__v4di)
11921 (__mmask8) -1);
11922}
11923
11924extern __inline __m256i
11927 __m256i __B, const int __imm)
11928{
11930 (__v4di) __B, __imm,
11931 (__v4di) __W,
11932 (__mmask8) __U);
11933}
11934
11935extern __inline __m256i
11938 const int __imm)
11939{
11941 (__v4di) __B, __imm,
11942 (__v4di)
11944 (__mmask8) __U);
11945}
11946
11947extern __inline __m128i
11950 const int __I)
11951{
11953 (__v8hi) __W,
11954 (__mmask8) __U);
11955}
11956
11957extern __inline __m128i
11960{
11962 (__v8hi)
11964 (__mmask8) __U);
11965}
11966
11967extern __inline __m128i
11970 const int __I)
11971{
11973 (__v8hi) __W,
11974 (__mmask8) __U);
11975}
11976
11977extern __inline __m128i
11980{
11982 (__v8hi)
11984 (__mmask8) __U);
11985}
11986
11987extern __inline __m256i
11990 const int __imm)
11991{
11993 (__v8si) __W,
11994 (__mmask8) __U);
11995}
11996
11997extern __inline __m256i
12000{
12002 (__v8si)
12004 (__mmask8) __U);
12005}
12006
12007extern __inline __m128i
12010 const int __imm)
12011{
12013 (__v4si) __W,
12014 (__mmask8) __U);
12015}
12016
12017extern __inline __m128i
12020{
12022 (__v4si)
12024 (__mmask8) __U);
12025}
12026
12027extern __inline __m256i
12030{
12032 (__v4di)
12034 (__mmask8) -1);
12035}
12036
12037extern __inline __m256i
12040 const int __imm)
12041{
12043 (__v4di) __W,
12044 (__mmask8) __U);
12045}
12046
12047extern __inline __m256i
12050{
12052 (__v4di)
12054 (__mmask8) __U);
12055}
12056
12057extern __inline __m128i
12059_mm_srai_epi64 (__m128i __A, const int __imm)
12060{
12062 (__v2di)
12064 (__mmask8) -1);
12065}
12066
12067extern __inline __m128i
12070 const int __imm)
12071{
12073 (__v2di) __W,
12074 (__mmask8) __U);
12075}
12076
12077extern __inline __m128i
12080{
12082 (__v2di)
12084 (__mmask8) __U);
12085}
12086
12087extern __inline __m128i
12090{
12092 (__v4si) __W,
12093 (__mmask8) __U);
12094}
12095
12096extern __inline __m128i
12099{
12101 (__v4si)
12103 (__mmask8) __U);
12104}
12105
12106extern __inline __m128i
12109{
12111 (__v2di) __W,
12112 (__mmask8) __U);
12113}
12114
12115extern __inline __m128i
12118{
12120 (__v2di)
12122 (__mmask8) __U);
12123}
12124
12125extern __inline __m256i
12128 int __B)
12129{
12131 (__v8si) __W,
12132 (__mmask8) __U);
12133}
12134
12135extern __inline __m256i
12138{
12140 (__v8si)
12142 (__mmask8) __U);
12143}
12144
12145extern __inline __m256i
12148 int __B)
12149{
12151 (__v4di) __W,
12152 (__mmask8) __U);
12153}
12154
12155extern __inline __m256i
12158{
12160 (__v4di)
12162 (__mmask8) __U);
12163}
12164
12165extern __inline __m256d
12168 const int __imm)
12169{
12171 (__v4df) __W,
12172 (__mmask8) __U);
12173}
12174
12175extern __inline __m256d
12178{
12180 (__v4df)
12182 (__mmask8) __U);
12183}
12184
12185extern __inline __m256d
12188 const int __C)
12189{
12191 (__v4df) __W,
12192 (__mmask8) __U);
12193}
12194
12195extern __inline __m256d
12198{
12200 (__v4df)
12202 (__mmask8) __U);
12203}
12204
12205extern __inline __m128d
12208 const int __C)
12209{
12211 (__v2df) __W,
12212 (__mmask8) __U);
12213}
12214
12215extern __inline __m128d
12218{
12220 (__v2df)
12221 _mm_setzero_pd (),
12222 (__mmask8) __U);
12223}
12224
12225extern __inline __m256
12228 const int __C)
12229{
12231 (__v8sf) __W,
12232 (__mmask8) __U);
12233}
12234
12235extern __inline __m256
12238{
12240 (__v8sf)
12242 (__mmask8) __U);
12243}
12244
12245extern __inline __m128
12248 const int __C)
12249{
12251 (__v4sf) __W,
12252 (__mmask8) __U);
12253}
12254
12255extern __inline __m128
12258{
12260 (__v4sf)
12261 _mm_setzero_ps (),
12262 (__mmask8) __U);
12263}
12264
12265extern __inline __m256d
12268{
12270 (__v4df) __W,
12271 (__mmask8) __U);
12272}
12273
12274extern __inline __m256
12277{
12279 (__v8sf) __W,
12280 (__mmask8) __U);
12281}
12282
12283extern __inline __m256i
12286{
12288 (__v4di) __W,
12289 (__mmask8) __U);
12290}
12291
12292extern __inline __m256i
12295{
12297 (__v8si) __W,
12298 (__mmask8) __U);
12299}
12300
12301extern __inline __m128d
12304{
12306 (__v2df) __W,
12307 (__mmask8) __U);
12308}
12309
12310extern __inline __m128
12313{
12315 (__v4sf) __W,
12316 (__mmask8) __U);
12317}
12318
12319extern __inline __m128i
12322{
12324 (__v2di) __W,
12325 (__mmask8) __U);
12326}
12327
12328extern __inline __m128i
12331{
12333 (__v4si) __W,
12334 (__mmask8) __U);
12335}
12336
12337extern __inline __mmask8
12340{
12342 (__v4di) __Y, __P,
12343 (__mmask8) -1);
12344}
12345
12346extern __inline __mmask8
12349{
12351 (__v8si) __Y, __P,
12352 (__mmask8) -1);
12353}
12354
12355extern __inline __mmask8
12358{
12360 (__v4di) __Y, __P,
12361 (__mmask8) -1);
12362}
12363
12364extern __inline __mmask8
12367{
12369 (__v8si) __Y, __P,
12370 (__mmask8) -1);
12371}
12372
12373extern __inline __mmask8
12376{
12378 (__v4df) __Y, __P,
12379 (__mmask8) -1);
12380}
12381
12382extern __inline __mmask8
12385{
12387 (__v8sf) __Y, __P,
12388 (__mmask8) -1);
12389}
12390
12391extern __inline __mmask8
12394 const int __P)
12395{
12397 (__v4di) __Y, __P,
12398 (__mmask8) __U);
12399}
12400
12401extern __inline __mmask8
12404 const int __P)
12405{
12407 (__v8si) __Y, __P,
12408 (__mmask8) __U);
12409}
12410
12411extern __inline __mmask8
12414 const int __P)
12415{
12417 (__v4di) __Y, __P,
12418 (__mmask8) __U);
12419}
12420
12421extern __inline __mmask8
12424 const int __P)
12425{
12427 (__v8si) __Y, __P,
12428 (__mmask8) __U);
12429}
12430
12431extern __inline __mmask8
12434 const int __P)
12435{
12437 (__v4df) __Y, __P,
12438 (__mmask8) __U);
12439}
12440
12441extern __inline __mmask8
12444 const int __P)
12445{
12447 (__v8sf) __Y, __P,
12448 (__mmask8) __U);
12449}
12450
12451extern __inline __mmask8
12454{
12456 (__v2di) __Y, __P,
12457 (__mmask8) -1);
12458}
12459
12460extern __inline __mmask8
12463{
12465 (__v4si) __Y, __P,
12466 (__mmask8) -1);
12467}
12468
12469extern __inline __mmask8
12472{
12474 (__v2di) __Y, __P,
12475 (__mmask8) -1);
12476}
12477
12478extern __inline __mmask8
12481{
12483 (__v4si) __Y, __P,
12484 (__mmask8) -1);
12485}
12486
12487extern __inline __mmask8
12490{
12492 (__v2df) __Y, __P,
12493 (__mmask8) -1);
12494}
12495
12496extern __inline __mmask8
12498_mm_cmp_ps_mask (__m128 __X, __m128 __Y, const int __P)
12499{
12501 (__v4sf) __Y, __P,
12502 (__mmask8) -1);
12503}
12504
12505extern __inline __mmask8
12508 const int __P)
12509{
12511 (__v2di) __Y, __P,
12512 (__mmask8) __U);
12513}
12514
12515extern __inline __mmask8
12518 const int __P)
12519{
12521 (__v4si) __Y, __P,
12522 (__mmask8) __U);
12523}
12524
12525extern __inline __mmask8
12528 const int __P)
12529{
12531 (__v2di) __Y, __P,
12532 (__mmask8) __U);
12533}
12534
12535extern __inline __mmask8
12538 const int __P)
12539{
12541 (__v4si) __Y, __P,
12542 (__mmask8) __U);
12543}
12544
12545extern __inline __mmask8
12548 const int __P)
12549{
12551 (__v2df) __Y, __P,
12552 (__mmask8) __U);
12553}
12554
12555extern __inline __mmask8
12558 const int __P)
12559{
12561 (__v4sf) __Y, __P,
12562 (__mmask8) __U);
12563}
12564
12565extern __inline __m256d
12567_mm256_permutex_pd (__m256d __X, const int __M)
12568{
12570 (__v4df)
12572 (__mmask8) -1);
12573}
12574
12575#else
/* Macro form of _mm256_permutex_pd, provided in the #else arm of the
   __OPTIMIZE__ check.  Expands to __builtin_ia32_permdf256_mask applied
   to X (viewed as __v4df) with the selector M converted to int; the
   third operand is _mm256_undefined_pd () and the mask is (__mmask8)-1.
   The result is cast to __m256d.
   NOTE(review): presumably a macro is used here so that M reaches the
   builtin as a literal constant when nothing is inlined -- confirm.  */
#define _mm256_permutex_pd(X, M)                                          \
  ((__m256d) __builtin_ia32_permdf256_mask ((__v4df)(__m256d)(X), (int)(M), \
                                            (__v4df)(__m256d)             \
                                            _mm256_undefined_pd (),       \
                                            (__mmask8)-1))
12581
/* 256-bit permutex_epi64 family.  All three forward X (as __v4di) and the
   selector I (cast to int) to __builtin_ia32_permdi256_mask and differ
   only in the last two operands:
     plain  - zero vector, mask (__mmask8) -1 (all bits set);
     maskz  - zero vector, caller mask M;
     mask   - caller vector W, caller mask M.  */
#define _mm256_permutex_epi64(X, I) \
  ((__m256i) __builtin_ia32_permdi256_mask ((__v4di)(__m256i)(X), \
      (int)(I), \
      (__v4di)(__m256i)(_mm256_setzero_si256 ()), \
      (__mmask8) -1))

#define _mm256_maskz_permutex_epi64(M, X, I) \
  ((__m256i) __builtin_ia32_permdi256_mask ((__v4di)(__m256i)(X), \
      (int)(I), \
      (__v4di)(__m256i)(_mm256_setzero_si256 ()), \
      (__mmask8)(M)))

#define _mm256_mask_permutex_epi64(W, M, X, I) \
  ((__m256i) __builtin_ia32_permdi256_mask ((__v4di)(__m256i)(X), \
      (int)(I), \
      (__v4di)(__m256i)(W), \
      (__mmask8)(M)))
12601
/* 256-bit insertf32x4 family.  Each macro passes X (as __v8sf), Y (as
   __v4sf) and the position C (cast to int) to
   __builtin_ia32_insertf32x4_256_mask.  The last two operands are:
     plain  - _mm256_setzero_ps (), (__mmask8)-1;
     mask   - W, U;
     maskz  - _mm256_setzero_ps (), U.  */
#define _mm256_insertf32x4(X, Y, C) \
  ((__m256) __builtin_ia32_insertf32x4_256_mask ((__v8sf)(__m256) (X), \
      (__v4sf)(__m128) (Y), (int) (C), \
      (__v8sf)(__m256)_mm256_setzero_ps (), \
      (__mmask8)-1))

#define _mm256_mask_insertf32x4(W, U, X, Y, C) \
  ((__m256) __builtin_ia32_insertf32x4_256_mask ((__v8sf)(__m256) (X), \
      (__v4sf)(__m128) (Y), (int) (C), \
      (__v8sf)(__m256)(W), \
      (__mmask8)(U)))

#define _mm256_maskz_insertf32x4(U, X, Y, C) \
  ((__m256) __builtin_ia32_insertf32x4_256_mask ((__v8sf)(__m256) (X), \
      (__v4sf)(__m128) (Y), (int) (C), \
      (__v8sf)(__m256)_mm256_setzero_ps (), \
      (__mmask8)(U)))
12619
/* 256-bit inserti32x4 family.  Each macro passes X (as __v8si), Y (as
   __v4si) and the position C (cast to int) to
   __builtin_ia32_inserti32x4_256_mask.  The last two operands are:
     plain  - _mm256_setzero_si256 (), (__mmask8)-1;
     mask   - W, U;
     maskz  - _mm256_setzero_si256 (), U.  */
#define _mm256_inserti32x4(X, Y, C) \
  ((__m256i) __builtin_ia32_inserti32x4_256_mask ((__v8si)(__m256i) (X), \
      (__v4si)(__m128i) (Y), (int) (C), \
      (__v8si)(__m256i)_mm256_setzero_si256 (), \
      (__mmask8)-1))

#define _mm256_mask_inserti32x4(W, U, X, Y, C) \
  ((__m256i) __builtin_ia32_inserti32x4_256_mask ((__v8si)(__m256i) (X), \
      (__v4si)(__m128i) (Y), (int) (C), \
      (__v8si)(__m256i)(W), \
      (__mmask8)(U)))

#define _mm256_maskz_inserti32x4(U, X, Y, C) \
  ((__m256i) __builtin_ia32_inserti32x4_256_mask ((__v8si)(__m256i) (X), \
      (__v4si)(__m128i) (Y), (int) (C), \
      (__v8si)(__m256i)_mm256_setzero_si256 (), \
      (__mmask8)(U)))
12637
/* 256-bit extractf32x4_ps family.  Each macro passes X (as __v8sf) and
   the position C (cast to int) to __builtin_ia32_extractf32x4_256_mask
   and yields an __m128.  The last two operands are:
     plain  - _mm_setzero_ps (), (__mmask8)-1;
     mask   - W, U;
     maskz  - _mm_setzero_ps (), U.  */
#define _mm256_extractf32x4_ps(X, C) \
  ((__m128) __builtin_ia32_extractf32x4_256_mask ((__v8sf)(__m256) (X), \
      (int) (C), \
      (__v4sf)(__m128)_mm_setzero_ps (), \
      (__mmask8)-1))

#define _mm256_mask_extractf32x4_ps(W, U, X, C) \
  ((__m128) __builtin_ia32_extractf32x4_256_mask ((__v8sf)(__m256) (X), \
      (int) (C), \
      (__v4sf)(__m128)(W), \
      (__mmask8)(U)))

#define _mm256_maskz_extractf32x4_ps(U, X, C) \
  ((__m128) __builtin_ia32_extractf32x4_256_mask ((__v8sf)(__m256) (X), \
      (int) (C), \
      (__v4sf)(__m128)_mm_setzero_ps (), \
      (__mmask8)(U)))
12655
/* 256-bit extracti32x4_epi32 family.  Each macro passes X (as __v8si)
   and the position C (cast to int) to
   __builtin_ia32_extracti32x4_256_mask and yields an __m128i.  The last
   two operands are:
     plain  - _mm_setzero_si128 (), (__mmask8)-1;
     mask   - W, U;
     maskz  - _mm_setzero_si128 (), U.  */
#define _mm256_extracti32x4_epi32(X, C) \
  ((__m128i) __builtin_ia32_extracti32x4_256_mask ((__v8si)(__m256i) (X), \
      (int) (C), \
      (__v4si)(__m128i)_mm_setzero_si128 (), \
      (__mmask8)-1))

#define _mm256_mask_extracti32x4_epi32(W, U, X, C) \
  ((__m128i) __builtin_ia32_extracti32x4_256_mask ((__v8si)(__m256i) (X), \
      (int) (C), \
      (__v4si)(__m128i)(W), \
      (__mmask8)(U)))

#define _mm256_maskz_extracti32x4_epi32(U, X, C) \
  ((__m128i) __builtin_ia32_extracti32x4_256_mask ((__v8si)(__m256i) (X), \
      (int) (C), \
      (__v4si)(__m128i)_mm_setzero_si128 (), \
      (__mmask8)(U)))
12667
/* 256-bit shuffle_i64x2 family.  Each macro passes X and Y (as __v4di)
   and the control C (cast to int) to __builtin_ia32_shuf_i64x2_256_mask.
   The last two operands are:
     plain  - _mm256_setzero_si256 (), (__mmask8)-1;
     mask   - W, U;
     maskz  - _mm256_setzero_si256 (), U.  */
#define _mm256_shuffle_i64x2(X, Y, C) \
  ((__m256i) __builtin_ia32_shuf_i64x2_256_mask ((__v4di)(__m256i)(X), \
      (__v4di)(__m256i)(Y), (int)(C), \
      (__v4di)(__m256i)_mm256_setzero_si256 (), \
      (__mmask8)-1))

#define _mm256_mask_shuffle_i64x2(W, U, X, Y, C) \
  ((__m256i) __builtin_ia32_shuf_i64x2_256_mask ((__v4di)(__m256i)(X), \
      (__v4di)(__m256i)(Y), (int)(C), \
      (__v4di)(__m256i)(W), \
      (__mmask8)(U)))

#define _mm256_maskz_shuffle_i64x2(U, X, Y, C) \
  ((__m256i) __builtin_ia32_shuf_i64x2_256_mask ((__v4di)(__m256i)(X), \
      (__v4di)(__m256i)(Y), (int)(C), \
      (__v4di)(__m256i)_mm256_setzero_si256 (), \
      (__mmask8)(U)))
12685
/* 256-bit shuffle_i32x4 family.  Each macro passes X and Y (as __v8si)
   and the control C (cast to int) to __builtin_ia32_shuf_i32x4_256_mask.
   The last two operands are:
     plain  - _mm256_setzero_si256 (), (__mmask8)-1;
     mask   - W, U;
     maskz  - _mm256_setzero_si256 (), U.  */
#define _mm256_shuffle_i32x4(X, Y, C) \
  ((__m256i) __builtin_ia32_shuf_i32x4_256_mask ((__v8si)(__m256i)(X), \
      (__v8si)(__m256i)(Y), (int)(C), \
      (__v8si)(__m256i) _mm256_setzero_si256 (), \
      (__mmask8)-1))

#define _mm256_mask_shuffle_i32x4(W, U, X, Y, C) \
  ((__m256i) __builtin_ia32_shuf_i32x4_256_mask ((__v8si)(__m256i)(X), \
      (__v8si)(__m256i)(Y), (int)(C), \
      (__v8si)(__m256i)(W), \
      (__mmask8)(U)))

#define _mm256_maskz_shuffle_i32x4(U, X, Y, C) \
  ((__m256i) __builtin_ia32_shuf_i32x4_256_mask ((__v8si)(__m256i)(X), \
      (__v8si)(__m256i)(Y), (int)(C), \
      (__v8si)(__m256i) _mm256_setzero_si256 (), \
      (__mmask8)(U)))
12705
/* 256-bit shuffle_f64x2 family.  Each macro passes X and Y (as __v4df)
   and the control C (cast to int) to __builtin_ia32_shuf_f64x2_256_mask.
   The last two operands are:
     plain  - _mm256_setzero_pd (), (__mmask8)-1;
     mask   - W, U;
     maskz  - _mm256_setzero_pd (), U.  */
#define _mm256_shuffle_f64x2(X, Y, C) \
  ((__m256d) __builtin_ia32_shuf_f64x2_256_mask ((__v4df)(__m256d)(X), \
      (__v4df)(__m256d)(Y), (int)(C), \
      (__v4df)(__m256d)_mm256_setzero_pd (), \
      (__mmask8)-1))

#define _mm256_mask_shuffle_f64x2(W, U, X, Y, C) \
  ((__m256d) __builtin_ia32_shuf_f64x2_256_mask ((__v4df)(__m256d)(X), \
      (__v4df)(__m256d)(Y), (int)(C), \
      (__v4df)(__m256d)(W), \
      (__mmask8)(U)))

#define _mm256_maskz_shuffle_f64x2(U, X, Y, C) \
  ((__m256d) __builtin_ia32_shuf_f64x2_256_mask ((__v4df)(__m256d)(X), \
      (__v4df)(__m256d)(Y), (int)(C), \
      (__v4df)(__m256d)_mm256_setzero_pd (), \
      (__mmask8)(U)))
12723
/* 256-bit shuffle_f32x4 family.  Each macro passes X and Y (as __v8sf)
   and the control C (cast to int) to __builtin_ia32_shuf_f32x4_256_mask.
   The last two operands are:
     plain  - _mm256_setzero_ps (), (__mmask8)-1;
     mask   - W, U;
     maskz  - _mm256_setzero_ps (), U.  */
#define _mm256_shuffle_f32x4(X, Y, C) \
  ((__m256) __builtin_ia32_shuf_f32x4_256_mask ((__v8sf)(__m256)(X), \
      (__v8sf)(__m256)(Y), (int)(C), \
      (__v8sf)(__m256)_mm256_setzero_ps (), \
      (__mmask8)-1))

#define _mm256_mask_shuffle_f32x4(W, U, X, Y, C) \
  ((__m256) __builtin_ia32_shuf_f32x4_256_mask ((__v8sf)(__m256)(X), \
      (__v8sf)(__m256)(Y), (int)(C), \
      (__v8sf)(__m256)(W), \
      (__mmask8)(U)))

#define _mm256_maskz_shuffle_f32x4(U, X, Y, C) \
  ((__m256) __builtin_ia32_shuf_f32x4_256_mask ((__v8sf)(__m256)(X), \
      (__v8sf)(__m256)(Y), (int)(C), \
      (__v8sf)(__m256)_mm256_setzero_ps (), \
      (__mmask8)(U)))
12741
/* Masked shuffle_pd macros.  The 256-bit pair calls
   __builtin_ia32_shufpd256_mask on A and B viewed as __v4df; the 128-bit
   pair calls __builtin_ia32_shufpd128_mask on A and B viewed as __v2df.
   C is cast to int.  The `mask' forms pass W and U as the last two
   operands; the `maskz' forms pass a zero vector and U.  */
#define _mm256_mask_shuffle_pd(W, U, A, B, C) \
  ((__m256d)__builtin_ia32_shufpd256_mask ((__v4df)(__m256d)(A), \
      (__v4df)(__m256d)(B), (int)(C), \
      (__v4df)(__m256d)(W), \
      (__mmask8)(U)))

#define _mm256_maskz_shuffle_pd(U, A, B, C) \
  ((__m256d)__builtin_ia32_shufpd256_mask ((__v4df)(__m256d)(A), \
      (__v4df)(__m256d)(B), (int)(C), \
      (__v4df)(__m256d) _mm256_setzero_pd (), \
      (__mmask8)(U)))

#define _mm_mask_shuffle_pd(W, U, A, B, C) \
  ((__m128d)__builtin_ia32_shufpd128_mask ((__v2df)(__m128d)(A), \
      (__v2df)(__m128d)(B), (int)(C), \
      (__v2df)(__m128d)(W), \
      (__mmask8)(U)))

#define _mm_maskz_shuffle_pd(U, A, B, C) \
  ((__m128d)__builtin_ia32_shufpd128_mask ((__v2df)(__m128d)(A), \
      (__v2df)(__m128d)(B), (int)(C), \
      (__v2df)(__m128d)_mm_setzero_pd (), \
      (__mmask8)(U)))
12766
/* Masked shuffle_ps macros.  The 256-bit pair calls
   __builtin_ia32_shufps256_mask on A and B viewed as __v8sf; the 128-bit
   pair calls __builtin_ia32_shufps128_mask on A and B viewed as __v4sf.
   C is cast to int.  The `mask' forms pass W and U as the last two
   operands; the `maskz' forms pass a zero vector and U.  */
#define _mm256_mask_shuffle_ps(W, U, A, B, C) \
  ((__m256) __builtin_ia32_shufps256_mask ((__v8sf)(__m256)(A), \
      (__v8sf)(__m256)(B), (int)(C), \
      (__v8sf)(__m256)(W), \
      (__mmask8)(U)))

#define _mm256_maskz_shuffle_ps(U, A, B, C) \
  ((__m256) __builtin_ia32_shufps256_mask ((__v8sf)(__m256)(A), \
      (__v8sf)(__m256)(B), (int)(C), \
      (__v8sf)(__m256)_mm256_setzero_ps (), \
      (__mmask8)(U)))

#define _mm_mask_shuffle_ps(W, U, A, B, C) \
  ((__m128) __builtin_ia32_shufps128_mask ((__v4sf)(__m128)(A), \
      (__v4sf)(__m128)(B), (int)(C), \
      (__v4sf)(__m128)(W), \
      (__mmask8)(U)))

#define _mm_maskz_shuffle_ps(U, A, B, C) \
  ((__m128) __builtin_ia32_shufps128_mask ((__v4sf)(__m128)(A), \
      (__v4sf)(__m128)(B), (int)(C), \
      (__v4sf)(__m128)_mm_setzero_ps (), \
      (__mmask8)(U)))
12790
/* 256-bit fixupimm_pd family.  X and Y are passed as __v4df, Z as __v4di
   and C cast to int.  The plain and `mask' forms call
   __builtin_ia32_fixupimmpd256_mask with mask (__mmask8)(-1) and U
   respectively; the `maskz' form calls the separate
   __builtin_ia32_fixupimmpd256_maskz builtin with U.  */
#define _mm256_fixupimm_pd(X, Y, Z, C) \
  ((__m256d)__builtin_ia32_fixupimmpd256_mask ((__v4df)(__m256d)(X), \
      (__v4df)(__m256d)(Y), \
      (__v4di)(__m256i)(Z), (int)(C), \
      (__mmask8)(-1)))

#define _mm256_mask_fixupimm_pd(X, U, Y, Z, C) \
  ((__m256d)__builtin_ia32_fixupimmpd256_mask ((__v4df)(__m256d)(X), \
      (__v4df)(__m256d)(Y), \
      (__v4di)(__m256i)(Z), (int)(C), \
      (__mmask8)(U)))

#define _mm256_maskz_fixupimm_pd(U, X, Y, Z, C) \
  ((__m256d)__builtin_ia32_fixupimmpd256_maskz ((__v4df)(__m256d)(X), \
      (__v4df)(__m256d)(Y), \
      (__v4di)(__m256i)(Z), (int)(C), \
      (__mmask8)(U)))
12808
/* 256-bit fixupimm_ps family.  X and Y are passed as __v8sf, Z as __v8si
   and C cast to int.  The plain and `mask' forms call
   __builtin_ia32_fixupimmps256_mask with mask (__mmask8)(-1) and U
   respectively; the `maskz' form calls the separate
   __builtin_ia32_fixupimmps256_maskz builtin with U.  */
#define _mm256_fixupimm_ps(X, Y, Z, C) \
  ((__m256)__builtin_ia32_fixupimmps256_mask ((__v8sf)(__m256)(X), \
      (__v8sf)(__m256)(Y), \
      (__v8si)(__m256i)(Z), (int)(C), \
      (__mmask8)(-1)))

#define _mm256_mask_fixupimm_ps(X, U, Y, Z, C) \
  ((__m256)__builtin_ia32_fixupimmps256_mask ((__v8sf)(__m256)(X), \
      (__v8sf)(__m256)(Y), \
      (__v8si)(__m256i)(Z), (int)(C), \
      (__mmask8)(U)))

#define _mm256_maskz_fixupimm_ps(U, X, Y, Z, C) \
  ((__m256)__builtin_ia32_fixupimmps256_maskz ((__v8sf)(__m256)(X), \
      (__v8sf)(__m256)(Y), \
      (__v8si)(__m256i)(Z), (int)(C), \
      (__mmask8)(U)))
12827
/* 128-bit fixupimm_pd family.  X and Y are passed as __v2df, Z as __v2di
   and C cast to int.  The plain and `mask' forms call
   __builtin_ia32_fixupimmpd128_mask with mask (__mmask8)(-1) and U
   respectively; the `maskz' form calls the separate
   __builtin_ia32_fixupimmpd128_maskz builtin with U.  */
#define _mm_fixupimm_pd(X, Y, Z, C) \
  ((__m128d)__builtin_ia32_fixupimmpd128_mask ((__v2df)(__m128d)(X), \
      (__v2df)(__m128d)(Y), \
      (__v2di)(__m128i)(Z), (int)(C), \
      (__mmask8)(-1)))

#define _mm_mask_fixupimm_pd(X, U, Y, Z, C) \
  ((__m128d)__builtin_ia32_fixupimmpd128_mask ((__v2df)(__m128d)(X), \
      (__v2df)(__m128d)(Y), \
      (__v2di)(__m128i)(Z), (int)(C), \
      (__mmask8)(U)))

#define _mm_maskz_fixupimm_pd(U, X, Y, Z, C) \
  ((__m128d)__builtin_ia32_fixupimmpd128_maskz ((__v2df)(__m128d)(X), \
      (__v2df)(__m128d)(Y), \
      (__v2di)(__m128i)(Z), (int)(C), \
      (__mmask8)(U)))
12846
/* 128-bit fixupimm_ps family.  X and Y are passed as __v4sf, Z as __v4si
   and C cast to int.  The plain and `mask' forms call
   __builtin_ia32_fixupimmps128_mask with mask (__mmask8)(-1) and U
   respectively; the `maskz' form calls the separate
   __builtin_ia32_fixupimmps128_maskz builtin with U.  */
#define _mm_fixupimm_ps(X, Y, Z, C) \
  ((__m128)__builtin_ia32_fixupimmps128_mask ((__v4sf)(__m128)(X), \
      (__v4sf)(__m128)(Y), \
      (__v4si)(__m128i)(Z), (int)(C), \
      (__mmask8)(-1)))

#define _mm_mask_fixupimm_ps(X, U, Y, Z, C) \
  ((__m128)__builtin_ia32_fixupimmps128_mask ((__v4sf)(__m128)(X), \
      (__v4sf)(__m128)(Y), \
      (__v4si)(__m128i)(Z), (int)(C), \
      (__mmask8)(U)))

#define _mm_maskz_fixupimm_ps(U, X, Y, Z, C) \
  ((__m128)__builtin_ia32_fixupimmps128_maskz ((__v4sf)(__m128)(X), \
      (__v4sf)(__m128)(Y), \
      (__v4si)(__m128i)(Z), (int)(C), \
      (__mmask8)(U)))
12864
/* Masked srli_epi32 macros.  The 256-bit pair calls
   __builtin_ia32_psrldi256_mask on A viewed as __v8si; the 128-bit pair
   calls __builtin_ia32_psrldi128_mask on A viewed as __v4si.  The count
   B is cast to int.  The `mask' forms pass W and U as the last two
   operands; the `maskz' forms pass a zero vector and U.  */
#define _mm256_mask_srli_epi32(W, U, A, B) \
  ((__m256i) __builtin_ia32_psrldi256_mask ((__v8si)(__m256i)(A), \
      (int)(B), (__v8si)(__m256i)(W), (__mmask8)(U)))

#define _mm256_maskz_srli_epi32(U, A, B) \
  ((__m256i) __builtin_ia32_psrldi256_mask ((__v8si)(__m256i)(A), \
      (int)(B), (__v8si)_mm256_setzero_si256 (), (__mmask8)(U)))

#define _mm_mask_srli_epi32(W, U, A, B) \
  ((__m128i) __builtin_ia32_psrldi128_mask ((__v4si)(__m128i)(A), \
      (int)(B), (__v4si)(__m128i)(W), (__mmask8)(U)))

#define _mm_maskz_srli_epi32(U, A, B) \
  ((__m128i) __builtin_ia32_psrldi128_mask ((__v4si)(__m128i)(A), \
      (int)(B), (__v4si)_mm_setzero_si128 (), (__mmask8)(U)))
12880
/* Masked srli_epi64 macros.  The 256-bit pair calls
   __builtin_ia32_psrlqi256_mask on A viewed as __v4di; the 128-bit pair
   calls __builtin_ia32_psrlqi128_mask on A viewed as __v2di.  The count
   B is cast to int.  The `mask' forms pass W and U as the last two
   operands; the `maskz' forms pass a zero vector and U.  */
#define _mm256_mask_srli_epi64(W, U, A, B) \
  ((__m256i) __builtin_ia32_psrlqi256_mask ((__v4di)(__m256i)(A), \
      (int)(B), (__v4di)(__m256i)(W), (__mmask8)(U)))

#define _mm256_maskz_srli_epi64(U, A, B) \
  ((__m256i) __builtin_ia32_psrlqi256_mask ((__v4di)(__m256i)(A), \
      (int)(B), (__v4di)_mm256_setzero_si256 (), (__mmask8)(U)))

#define _mm_mask_srli_epi64(W, U, A, B) \
  ((__m128i) __builtin_ia32_psrlqi128_mask ((__v2di)(__m128i)(A), \
      (int)(B), (__v2di)(__m128i)(W), (__mmask8)(U)))

#define _mm_maskz_srli_epi64(U, A, B) \
  ((__m128i) __builtin_ia32_psrlqi128_mask ((__v2di)(__m128i)(A), \
      (int)(B), (__v2di)_mm_setzero_si128 (), (__mmask8)(U)))
12896
/* 256-bit masked slli macros.  The epi32 pair calls
   __builtin_ia32_pslldi256_mask on X viewed as __v8si; the epi64 pair
   calls __builtin_ia32_psllqi256_mask on X viewed as __v4di.  The count
   C is cast to int.  The `mask' forms pass W and U as the last two
   operands; the `maskz' forms pass _mm256_setzero_si256 () and U.  */
#define _mm256_mask_slli_epi32(W, U, X, C) \
  ((__m256i)__builtin_ia32_pslldi256_mask ((__v8si)(__m256i)(X), (int)(C), \
      (__v8si)(__m256i)(W), \
      (__mmask8)(U)))

#define _mm256_maskz_slli_epi32(U, X, C) \
  ((__m256i)__builtin_ia32_pslldi256_mask ((__v8si)(__m256i)(X), (int)(C), \
      (__v8si)(__m256i)_mm256_setzero_si256 (), \
      (__mmask8)(U)))

#define _mm256_mask_slli_epi64(W, U, X, C) \
  ((__m256i)__builtin_ia32_psllqi256_mask ((__v4di)(__m256i)(X), (int)(C), \
      (__v4di)(__m256i)(W), \
      (__mmask8)(U)))

#define _mm256_maskz_slli_epi64(U, X, C) \
  ((__m256i)__builtin_ia32_psllqi256_mask ((__v4di)(__m256i)(X), (int)(C), \
      (__v4di)(__m256i)_mm256_setzero_si256 (), \
      (__mmask8)(U)))
12916
/* 128-bit masked slli macros.  The epi32 pair calls
   __builtin_ia32_pslldi128_mask on X viewed as __v4si; the epi64 pair
   calls __builtin_ia32_psllqi128_mask on X viewed as __v2di.  The count
   C is cast to int.  The `mask' forms pass W and U as the last two
   operands; the `maskz' forms pass _mm_setzero_si128 () and U.  */
#define _mm_mask_slli_epi32(W, U, X, C) \
  ((__m128i)__builtin_ia32_pslldi128_mask ((__v4si)(__m128i)(X), (int)(C), \
      (__v4si)(__m128i)(W), \
      (__mmask8)(U)))

#define _mm_maskz_slli_epi32(U, X, C) \
  ((__m128i)__builtin_ia32_pslldi128_mask ((__v4si)(__m128i)(X), (int)(C), \
      (__v4si)(__m128i)_mm_setzero_si128 (), \
      (__mmask8)(U)))

#define _mm_mask_slli_epi64(W, U, X, C) \
  ((__m128i)__builtin_ia32_psllqi128_mask ((__v2di)(__m128i)(X), (int)(C), \
      (__v2di)(__m128i)(W), \
      (__mmask8)(U)))

#define _mm_maskz_slli_epi64(U, X, C) \
  ((__m128i)__builtin_ia32_psllqi128_mask ((__v2di)(__m128i)(X), (int)(C), \
      (__v2di)(__m128i)_mm_setzero_si128 (), \
      (__mmask8)(U)))
12936
/* 256-bit ternarylogic_epi64 family.  A, B and C are passed as __v4di
   and the immediate I is cast to unsigned char.  The plain and `mask'
   forms call __builtin_ia32_pternlogq256_mask with mask (__mmask8) -1
   and U respectively; the `maskz' form calls the separate
   __builtin_ia32_pternlogq256_maskz builtin with U.  */
#define _mm256_ternarylogic_epi64(A, B, C, I) \
  ((__m256i) \
   __builtin_ia32_pternlogq256_mask ((__v4di) (__m256i) (A), \
       (__v4di) (__m256i) (B), \
       (__v4di) (__m256i) (C), \
       (unsigned char) (I), \
       (__mmask8) -1))

#define _mm256_mask_ternarylogic_epi64(A, U, B, C, I) \
  ((__m256i) \
   __builtin_ia32_pternlogq256_mask ((__v4di) (__m256i) (A), \
       (__v4di) (__m256i) (B), \
       (__v4di) (__m256i) (C), \
       (unsigned char) (I), \
       (__mmask8) (U)))

#define _mm256_maskz_ternarylogic_epi64(U, A, B, C, I) \
  ((__m256i) \
   __builtin_ia32_pternlogq256_maskz ((__v4di) (__m256i) (A), \
       (__v4di) (__m256i) (B), \
       (__v4di) (__m256i) (C), \
       (unsigned char) (I), \
       (__mmask8) (U)))
12960
/* 256-bit ternarylogic_epi32 family.  A, B and C are passed as __v8si
   and the immediate I is cast to unsigned char.  The plain and `mask'
   forms call __builtin_ia32_pternlogd256_mask with mask (__mmask8) -1
   and U respectively; the `maskz' form calls the separate
   __builtin_ia32_pternlogd256_maskz builtin with U.  */
#define _mm256_ternarylogic_epi32(A, B, C, I) \
  ((__m256i) \
   __builtin_ia32_pternlogd256_mask ((__v8si) (__m256i) (A), \
       (__v8si) (__m256i) (B), \
       (__v8si) (__m256i) (C), \
       (unsigned char) (I), \
       (__mmask8) -1))

#define _mm256_mask_ternarylogic_epi32(A, U, B, C, I) \
  ((__m256i) \
   __builtin_ia32_pternlogd256_mask ((__v8si) (__m256i) (A), \
       (__v8si) (__m256i) (B), \
       (__v8si) (__m256i) (C), \
       (unsigned char) (I), \
       (__mmask8) (U)))

#define _mm256_maskz_ternarylogic_epi32(U, A, B, C, I) \
  ((__m256i) \
   __builtin_ia32_pternlogd256_maskz ((__v8si) (__m256i) (A), \
       (__v8si) (__m256i) (B), \
       (__v8si) (__m256i) (C), \
       (unsigned char) (I), \
       (__mmask8) (U)))
12984
/* 128-bit ternarylogic_epi64 family.  A, B and C are passed as __v2di
   and the immediate I is cast to unsigned char.  The plain and `mask'
   forms call __builtin_ia32_pternlogq128_mask with mask (__mmask8) -1
   and U respectively; the `maskz' form calls the separate
   __builtin_ia32_pternlogq128_maskz builtin with U.  */
#define _mm_ternarylogic_epi64(A, B, C, I) \
  ((__m128i) \
   __builtin_ia32_pternlogq128_mask ((__v2di) (__m128i) (A), \
       (__v2di) (__m128i) (B), \
       (__v2di) (__m128i) (C), \
       (unsigned char) (I), \
       (__mmask8) -1))

#define _mm_mask_ternarylogic_epi64(A, U, B, C, I) \
  ((__m128i) \
   __builtin_ia32_pternlogq128_mask ((__v2di) (__m128i) (A), \
       (__v2di) (__m128i) (B), \
       (__v2di) (__m128i) (C), \
       (unsigned char) (I), \
       (__mmask8) (U)))

#define _mm_maskz_ternarylogic_epi64(U, A, B, C, I) \
  ((__m128i) \
   __builtin_ia32_pternlogq128_maskz ((__v2di) (__m128i) (A), \
       (__v2di) (__m128i) (B), \
       (__v2di) (__m128i) (C), \
       (unsigned char) (I), \
       (__mmask8) (U)))
13008
/* 128-bit ternarylogic_epi32 family.  A, B and C are passed as __v4si
   and the immediate I is cast to unsigned char.  The plain and `mask'
   forms call __builtin_ia32_pternlogd128_mask with mask (__mmask8) -1
   and U respectively; the `maskz' form calls the separate
   __builtin_ia32_pternlogd128_maskz builtin with U.  */
#define _mm_ternarylogic_epi32(A, B, C, I) \
  ((__m128i) \
   __builtin_ia32_pternlogd128_mask ((__v4si) (__m128i) (A), \
       (__v4si) (__m128i) (B), \
       (__v4si) (__m128i) (C), \
       (unsigned char) (I), \
       (__mmask8) -1))

#define _mm_mask_ternarylogic_epi32(A, U, B, C, I) \
  ((__m128i) \
   __builtin_ia32_pternlogd128_mask ((__v4si) (__m128i) (A), \
       (__v4si) (__m128i) (B), \
       (__v4si) (__m128i) (C), \
       (unsigned char) (I), \
       (__mmask8) (U)))

#define _mm_maskz_ternarylogic_epi32(U, A, B, C, I) \
  ((__m128i) \
   __builtin_ia32_pternlogd128_maskz ((__v4si) (__m128i) (A), \
       (__v4si) (__m128i) (B), \
       (__v4si) (__m128i) (C), \
       (unsigned char) (I), \
       (__mmask8) (U)))
13032
/* 256-bit roundscale_ps family.  Each macro passes A (as __v8sf) and the
   immediate B (cast to int) to __builtin_ia32_rndscaleps_256_mask.  The
   last two operands are:
     plain  - _mm256_setzero_ps (), (__mmask8)-1;
     mask   - W, U;
     maskz  - _mm256_setzero_ps (), U.  */
#define _mm256_roundscale_ps(A, B) \
  ((__m256) __builtin_ia32_rndscaleps_256_mask ((__v8sf)(__m256)(A), \
      (int)(B), (__v8sf)(__m256)_mm256_setzero_ps (), (__mmask8)-1))

#define _mm256_mask_roundscale_ps(W, U, A, B) \
  ((__m256) __builtin_ia32_rndscaleps_256_mask ((__v8sf)(__m256)(A), \
      (int)(B), (__v8sf)(__m256)(W), (__mmask8)(U)))

#define _mm256_maskz_roundscale_ps(U, A, B) \
  ((__m256) __builtin_ia32_rndscaleps_256_mask ((__v8sf)(__m256)(A), \
      (int)(B), (__v8sf)(__m256)_mm256_setzero_ps (), (__mmask8)(U)))
13044
/* 256-bit roundscale_pd family.  Each macro passes A (as __v4df) and the
   immediate B (cast to int) to __builtin_ia32_rndscalepd_256_mask.  The
   last two operands are:
     plain  - _mm256_setzero_pd (), (__mmask8)-1;
     mask   - W, U;
     maskz  - _mm256_setzero_pd (), U.  */
#define _mm256_roundscale_pd(A, B) \
  ((__m256d) __builtin_ia32_rndscalepd_256_mask ((__v4df)(__m256d)(A), \
      (int)(B), (__v4df)(__m256d)_mm256_setzero_pd (), (__mmask8)-1))

#define _mm256_mask_roundscale_pd(W, U, A, B) \
  ((__m256d) __builtin_ia32_rndscalepd_256_mask ((__v4df)(__m256d)(A), \
      (int)(B), (__v4df)(__m256d)(W), (__mmask8)(U)))

#define _mm256_maskz_roundscale_pd(U, A, B) \
  ((__m256d) __builtin_ia32_rndscalepd_256_mask ((__v4df)(__m256d)(A), \
      (int)(B), (__v4df)(__m256d)_mm256_setzero_pd (), (__mmask8)(U)))
13056
/* 128-bit roundscale_ps family.  Each macro passes A (as __v4sf) and the
   immediate B (cast to int) to __builtin_ia32_rndscaleps_128_mask.  The
   last two operands are:
     plain  - _mm_setzero_ps (), (__mmask8)-1;
     mask   - W, U;
     maskz  - _mm_setzero_ps (), U.  */
#define _mm_roundscale_ps(A, B) \
  ((__m128) __builtin_ia32_rndscaleps_128_mask ((__v4sf)(__m128)(A), \
      (int)(B), (__v4sf)(__m128)_mm_setzero_ps (), (__mmask8)-1))

#define _mm_mask_roundscale_ps(W, U, A, B) \
  ((__m128) __builtin_ia32_rndscaleps_128_mask ((__v4sf)(__m128)(A), \
      (int)(B), (__v4sf)(__m128)(W), (__mmask8)(U)))

#define _mm_maskz_roundscale_ps(U, A, B) \
  ((__m128) __builtin_ia32_rndscaleps_128_mask ((__v4sf)(__m128)(A), \
      (int)(B), (__v4sf)(__m128)_mm_setzero_ps (), (__mmask8)(U)))
13068
/* 128-bit roundscale_pd family.  Each macro passes A (as __v2df) and the
   immediate B (cast to int) to __builtin_ia32_rndscalepd_128_mask.  The
   last two operands are:
     plain  - _mm_setzero_pd (), (__mmask8)-1;
     mask   - W, U;
     maskz  - _mm_setzero_pd (), U.  */
#define _mm_roundscale_pd(A, B) \
  ((__m128d) __builtin_ia32_rndscalepd_128_mask ((__v2df)(__m128d)(A), \
      (int)(B), (__v2df)(__m128d)_mm_setzero_pd (), (__mmask8)-1))

#define _mm_mask_roundscale_pd(W, U, A, B) \
  ((__m128d) __builtin_ia32_rndscalepd_128_mask ((__v2df)(__m128d)(A), \
      (int)(B), (__v2df)(__m128d)(W), (__mmask8)(U)))

#define _mm_maskz_roundscale_pd(U, A, B) \
  ((__m128d) __builtin_ia32_rndscalepd_128_mask ((__v2df)(__m128d)(A), \
      (int)(B), (__v2df)(__m128d)_mm_setzero_pd (), (__mmask8)(U)))
13080
/* 256-bit getmant_ps family.  X is passed as __v8sf to
   __builtin_ia32_getmantps256_mask.  B and C are folded into a single
   int immediate as ((C)<<2) | (B).  The last two operands are:
     plain  - _mm256_setzero_ps (), (__mmask8)-1;
     mask   - W, U;
     maskz  - _mm256_setzero_ps (), U.  */
#define _mm256_getmant_ps(X, B, C) \
  ((__m256) __builtin_ia32_getmantps256_mask ((__v8sf)(__m256) (X), \
      (int)(((C)<<2) | (B)), \
      (__v8sf)(__m256)_mm256_setzero_ps (), \
      (__mmask8)-1))

#define _mm256_mask_getmant_ps(W, U, X, B, C) \
  ((__m256) __builtin_ia32_getmantps256_mask ((__v8sf)(__m256) (X), \
      (int)(((C)<<2) | (B)), \
      (__v8sf)(__m256)(W), \
      (__mmask8)(U)))

#define _mm256_maskz_getmant_ps(U, X, B, C) \
  ((__m256) __builtin_ia32_getmantps256_mask ((__v8sf)(__m256) (X), \
      (int)(((C)<<2) | (B)), \
      (__v8sf)(__m256)_mm256_setzero_ps (), \
      (__mmask8)(U)))
13098
/* 128-bit getmant_ps family.  X is passed as __v4sf to
   __builtin_ia32_getmantps128_mask.  B and C are folded into a single
   int immediate as ((C)<<2) | (B).  The last two operands are:
     plain  - _mm_setzero_ps (), (__mmask8)-1;
     mask   - W, U;
     maskz  - _mm_setzero_ps (), U.  */
#define _mm_getmant_ps(X, B, C) \
  ((__m128) __builtin_ia32_getmantps128_mask ((__v4sf)(__m128) (X), \
      (int)(((C)<<2) | (B)), \
      (__v4sf)(__m128)_mm_setzero_ps (), \
      (__mmask8)-1))

#define _mm_mask_getmant_ps(W, U, X, B, C) \
  ((__m128) __builtin_ia32_getmantps128_mask ((__v4sf)(__m128) (X), \
      (int)(((C)<<2) | (B)), \
      (__v4sf)(__m128)(W), \
      (__mmask8)(U)))

#define _mm_maskz_getmant_ps(U, X, B, C) \
  ((__m128) __builtin_ia32_getmantps128_mask ((__v4sf)(__m128) (X), \
      (int)(((C)<<2) | (B)), \
      (__v4sf)(__m128)_mm_setzero_ps (), \
      (__mmask8)(U)))
13116
/* 256-bit getmant_pd family.  X is passed as __v4df to
   __builtin_ia32_getmantpd256_mask.  B and C are folded into a single
   int immediate as ((C)<<2) | (B).  The last two operands are:
     plain  - _mm256_setzero_pd (), (__mmask8)-1;
     mask   - W, U;
     maskz  - _mm256_setzero_pd (), U.  */
#define _mm256_getmant_pd(X, B, C) \
  ((__m256d) __builtin_ia32_getmantpd256_mask ((__v4df)(__m256d) (X), \
      (int)(((C)<<2) | (B)), \
      (__v4df)(__m256d)_mm256_setzero_pd (), \
      (__mmask8)-1))

#define _mm256_mask_getmant_pd(W, U, X, B, C) \
  ((__m256d) __builtin_ia32_getmantpd256_mask ((__v4df)(__m256d) (X), \
      (int)(((C)<<2) | (B)), \
      (__v4df)(__m256d)(W), \
      (__mmask8)(U)))

#define _mm256_maskz_getmant_pd(U, X, B, C) \
  ((__m256d) __builtin_ia32_getmantpd256_mask ((__v4df)(__m256d) (X), \
      (int)(((C)<<2) | (B)), \
      (__v4df)(__m256d)_mm256_setzero_pd (), \
      (__mmask8)(U)))
13134
/* 128-bit getmant_pd family.  X is passed as __v2df to
   __builtin_ia32_getmantpd128_mask.  B and C are folded into a single
   int immediate as ((C)<<2) | (B).  The last two operands are:
     plain  - _mm_setzero_pd (), (__mmask8)-1;
     mask   - W, U;
     maskz  - _mm_setzero_pd (), U.  */
#define _mm_getmant_pd(X, B, C) \
  ((__m128d) __builtin_ia32_getmantpd128_mask ((__v2df)(__m128d) (X), \
      (int)(((C)<<2) | (B)), \
      (__v2df)(__m128d)_mm_setzero_pd (), \
      (__mmask8)-1))

#define _mm_mask_getmant_pd(W, U, X, B, C) \
  ((__m128d) __builtin_ia32_getmantpd128_mask ((__v2df)(__m128d) (X), \
      (int)(((C)<<2) | (B)), \
      (__v2df)(__m128d)(W), \
      (__mmask8)(U)))

#define _mm_maskz_getmant_pd(U, X, B, C) \
  ((__m128d) __builtin_ia32_getmantpd128_mask ((__v2df)(__m128d) (X), \
      (int)(((C)<<2) | (B)), \
      (__v2df)(__m128d)_mm_setzero_pd (), \
      (__mmask8)(U)))
13152
/* Masked i32gather_ps macros.  The 256-bit form calls
   __builtin_ia32_gather3siv8sf with V1OLD as __v8sf and INDEX as __v8si;
   the 128-bit form calls __builtin_ia32_gather3siv4sf with V1OLD as
   __v4sf and INDEX as __v4si.  ADDR is cast to void const *, MASK to
   __mmask8 and SCALE to int.
   The whole expansion is parenthesised so that a postfix operator
   applied to the macro result binds to the cast result rather than to
   the builtin call.  */
#define _mm256_mmask_i32gather_ps(V1OLD, MASK, INDEX, ADDR, SCALE) \
  ((__m256) __builtin_ia32_gather3siv8sf ((__v8sf)(__m256) (V1OLD), \
      (void const *) (ADDR), \
      (__v8si)(__m256i) (INDEX), \
      (__mmask8) (MASK), \
      (int) (SCALE)))

#define _mm_mmask_i32gather_ps(V1OLD, MASK, INDEX, ADDR, SCALE) \
  ((__m128) __builtin_ia32_gather3siv4sf ((__v4sf)(__m128) (V1OLD), \
      (void const *) (ADDR), \
      (__v4si)(__m128i) (INDEX), \
      (__mmask8) (MASK), \
      (int) (SCALE)))
13166
/* Masked i32gather_pd macros.  The 256-bit form calls
   __builtin_ia32_gather3siv4df with V1OLD as __v4df; the 128-bit form
   calls __builtin_ia32_gather3siv2df with V1OLD as __v2df.  In both,
   INDEX is a 128-bit vector viewed as __v4si, ADDR is cast to
   void const *, MASK to __mmask8 and SCALE to int.
   The whole expansion is parenthesised so that a postfix operator
   applied to the macro result binds to the cast result rather than to
   the builtin call.  */
#define _mm256_mmask_i32gather_pd(V1OLD, MASK, INDEX, ADDR, SCALE) \
  ((__m256d) __builtin_ia32_gather3siv4df ((__v4df)(__m256d) (V1OLD), \
      (void const *) (ADDR), \
      (__v4si)(__m128i) (INDEX), \
      (__mmask8) (MASK), \
      (int) (SCALE)))

#define _mm_mmask_i32gather_pd(V1OLD, MASK, INDEX, ADDR, SCALE) \
  ((__m128d) __builtin_ia32_gather3siv2df ((__v2df)(__m128d) (V1OLD), \
      (void const *) (ADDR), \
      (__v4si)(__m128i) (INDEX), \
      (__mmask8) (MASK), \
      (int) (SCALE)))
13180
/* Masked i64gather_ps macros.  Both forms yield an __m128 and view V1OLD
   as __v4sf.  The 256-bit-index form calls __builtin_ia32_gather3div8sf
   with INDEX as __v4di; the 128-bit-index form calls
   __builtin_ia32_gather3div4sf with INDEX as __v2di.  ADDR is cast to
   void const *, MASK to __mmask8 and SCALE to int.
   The whole expansion is parenthesised so that a postfix operator
   applied to the macro result binds to the cast result rather than to
   the builtin call.  */
#define _mm256_mmask_i64gather_ps(V1OLD, MASK, INDEX, ADDR, SCALE) \
  ((__m128) __builtin_ia32_gather3div8sf ((__v4sf)(__m128) (V1OLD), \
      (void const *) (ADDR), \
      (__v4di)(__m256i) (INDEX), \
      (__mmask8) (MASK), \
      (int) (SCALE)))

#define _mm_mmask_i64gather_ps(V1OLD, MASK, INDEX, ADDR, SCALE) \
  ((__m128) __builtin_ia32_gather3div4sf ((__v4sf)(__m128) (V1OLD), \
      (void const *) (ADDR), \
      (__v2di)(__m128i) (INDEX), \
      (__mmask8) (MASK), \
      (int) (SCALE)))
13194
/* Masked i64gather_pd macros.  The 256-bit form calls
   __builtin_ia32_gather3div4df with V1OLD as __v4df and INDEX as __v4di;
   the 128-bit form calls __builtin_ia32_gather3div2df with V1OLD as
   __v2df and INDEX as __v2di.  ADDR is cast to void const *, MASK to
   __mmask8 and SCALE to int.
   The whole expansion is parenthesised so that a postfix operator
   applied to the macro result binds to the cast result rather than to
   the builtin call.  */
#define _mm256_mmask_i64gather_pd(V1OLD, MASK, INDEX, ADDR, SCALE) \
  ((__m256d) __builtin_ia32_gather3div4df ((__v4df)(__m256d) (V1OLD), \
      (void const *) (ADDR), \
      (__v4di)(__m256i) (INDEX), \
      (__mmask8) (MASK), \
      (int) (SCALE)))

#define _mm_mmask_i64gather_pd(V1OLD, MASK, INDEX, ADDR, SCALE) \
  ((__m128d) __builtin_ia32_gather3div2df ((__v2df)(__m128d) (V1OLD), \
      (void const *) (ADDR), \
      (__v2di)(__m128i) (INDEX), \
      (__mmask8) (MASK), \
      (int) (SCALE)))
13208
/* Masked i32gather_epi32 macros.  The 256-bit form calls
   __builtin_ia32_gather3siv8si with V1OLD and INDEX as __v8si; the
   128-bit form calls __builtin_ia32_gather3siv4si with V1OLD and INDEX
   as __v4si.  ADDR is cast to void const *, MASK to __mmask8 and SCALE
   to int.
   The whole expansion is parenthesised so that a postfix operator
   applied to the macro result binds to the cast result rather than to
   the builtin call.  */
#define _mm256_mmask_i32gather_epi32(V1OLD, MASK, INDEX, ADDR, SCALE) \
  ((__m256i) __builtin_ia32_gather3siv8si ((__v8si)(__m256i) (V1OLD), \
      (void const *) (ADDR), \
      (__v8si)(__m256i) (INDEX), \
      (__mmask8) (MASK), \
      (int) (SCALE)))

#define _mm_mmask_i32gather_epi32(V1OLD, MASK, INDEX, ADDR, SCALE) \
  ((__m128i) __builtin_ia32_gather3siv4si ((__v4si)(__m128i) (V1OLD), \
      (void const *) (ADDR), \
      (__v4si)(__m128i) (INDEX), \
      (__mmask8) (MASK), \
      (int) (SCALE)))
13222
/* Masked i32gather_epi64 macros.  The 256-bit form calls
   __builtin_ia32_gather3siv4di with V1OLD as __v4di; the 128-bit form
   calls __builtin_ia32_gather3siv2di with V1OLD as __v2di.  In both,
   INDEX is a 128-bit vector viewed as __v4si, ADDR is cast to
   void const *, MASK to __mmask8 and SCALE to int.
   The whole expansion is parenthesised so that a postfix operator
   applied to the macro result binds to the cast result rather than to
   the builtin call.  */
#define _mm256_mmask_i32gather_epi64(V1OLD, MASK, INDEX, ADDR, SCALE) \
  ((__m256i) __builtin_ia32_gather3siv4di ((__v4di)(__m256i) (V1OLD), \
      (void const *) (ADDR), \
      (__v4si)(__m128i) (INDEX), \
      (__mmask8) (MASK), \
      (int) (SCALE)))

#define _mm_mmask_i32gather_epi64(V1OLD, MASK, INDEX, ADDR, SCALE) \
  ((__m128i) __builtin_ia32_gather3siv2di ((__v2di)(__m128i) (V1OLD), \
      (void const *) (ADDR), \
      (__v4si)(__m128i) (INDEX), \
      (__mmask8) (MASK), \
      (int) (SCALE)))
13236
/* Masked i64gather_epi32 macros.  Both forms yield an __m128i and view
   V1OLD as __v4si.  The 256-bit-index form calls
   __builtin_ia32_gather3div8si with INDEX as __v4di; the 128-bit-index
   form calls __builtin_ia32_gather3div4si with INDEX as __v2di.  ADDR is
   cast to void const *, MASK to __mmask8 and SCALE to int.
   The whole expansion is parenthesised so that a postfix operator
   applied to the macro result binds to the cast result rather than to
   the builtin call.  */
#define _mm256_mmask_i64gather_epi32(V1OLD, MASK, INDEX, ADDR, SCALE) \
  ((__m128i) __builtin_ia32_gather3div8si ((__v4si)(__m128i) (V1OLD), \
      (void const *) (ADDR), \
      (__v4di)(__m256i) (INDEX), \
      (__mmask8) (MASK), \
      (int) (SCALE)))

#define _mm_mmask_i64gather_epi32(V1OLD, MASK, INDEX, ADDR, SCALE) \
  ((__m128i) __builtin_ia32_gather3div4si ((__v4si)(__m128i) (V1OLD), \
      (void const *) (ADDR), \
      (__v2di)(__m128i) (INDEX), \
      (__mmask8) (MASK), \
      (int) (SCALE)))
13250
/* Masked i64gather_epi64 macros.  The 256-bit form calls
   __builtin_ia32_gather3div4di with V1OLD and INDEX as __v4di; the
   128-bit form calls __builtin_ia32_gather3div2di with V1OLD and INDEX
   as __v2di.  ADDR is cast to void const *, MASK to __mmask8 and SCALE
   to int.
   The whole expansion is parenthesised so that a postfix operator
   applied to the macro result binds to the cast result rather than to
   the builtin call.  */
#define _mm256_mmask_i64gather_epi64(V1OLD, MASK, INDEX, ADDR, SCALE) \
  ((__m256i) __builtin_ia32_gather3div4di ((__v4di)(__m256i) (V1OLD), \
      (void const *) (ADDR), \
      (__v4di)(__m256i) (INDEX), \
      (__mmask8) (MASK), \
      (int) (SCALE)))

#define _mm_mmask_i64gather_epi64(V1OLD, MASK, INDEX, ADDR, SCALE) \
  ((__m128i) __builtin_ia32_gather3div2di ((__v2di)(__m128i) (V1OLD), \
      (void const *) (ADDR), \
      (__v2di)(__m128i) (INDEX), \
      (__mmask8) (MASK), \
      (int) (SCALE)))
13264
/* i32scatter_ps macros.  The 256-bit pair calls
   __builtin_ia32_scattersiv8sf with INDEX as __v8si and V1 as __v8sf;
   the 128-bit pair calls __builtin_ia32_scattersiv4sf with INDEX as
   __v4si and V1 as __v4sf.  ADDR is cast to void * and SCALE to int.
   The unmasked forms pass the constant mask (__mmask8)0xFF; the `mask'
   forms pass MASK.  The expansions are plain builtin calls with no
   result cast.  */
#define _mm256_i32scatter_ps(ADDR, INDEX, V1, SCALE) \
  __builtin_ia32_scattersiv8sf ((void *) (ADDR), (__mmask8)0xFF, \
      (__v8si)(__m256i) (INDEX), \
      (__v8sf)(__m256) (V1), (int) (SCALE))

#define _mm256_mask_i32scatter_ps(ADDR, MASK, INDEX, V1, SCALE) \
  __builtin_ia32_scattersiv8sf ((void *) (ADDR), (__mmask8) (MASK), \
      (__v8si)(__m256i) (INDEX), \
      (__v8sf)(__m256) (V1), (int) (SCALE))

#define _mm_i32scatter_ps(ADDR, INDEX, V1, SCALE) \
  __builtin_ia32_scattersiv4sf ((void *) (ADDR), (__mmask8)0xFF, \
      (__v4si)(__m128i) (INDEX), \
      (__v4sf)(__m128) (V1), (int) (SCALE))

#define _mm_mask_i32scatter_ps(ADDR, MASK, INDEX, V1, SCALE) \
  __builtin_ia32_scattersiv4sf ((void *) (ADDR), (__mmask8) (MASK), \
      (__v4si)(__m128i) (INDEX), \
      (__v4sf)(__m128) (V1), (int) (SCALE))
13284
/* i32scatter_pd macros.  The 256-bit pair calls
   __builtin_ia32_scattersiv4df with V1 as __v4df; the 128-bit pair calls
   __builtin_ia32_scattersiv2df with V1 as __v2df.  In all four, INDEX is
   a 128-bit vector viewed as __v4si, ADDR is cast to void * and SCALE to
   int.  The unmasked forms pass the constant mask (__mmask8)0xFF; the
   `mask' forms pass MASK.  */
#define _mm256_i32scatter_pd(ADDR, INDEX, V1, SCALE) \
  __builtin_ia32_scattersiv4df ((void *) (ADDR), (__mmask8)0xFF, \
      (__v4si)(__m128i) (INDEX), \
      (__v4df)(__m256d) (V1), (int) (SCALE))

#define _mm256_mask_i32scatter_pd(ADDR, MASK, INDEX, V1, SCALE) \
  __builtin_ia32_scattersiv4df ((void *) (ADDR), (__mmask8) (MASK), \
      (__v4si)(__m128i) (INDEX), \
      (__v4df)(__m256d) (V1), (int) (SCALE))

#define _mm_i32scatter_pd(ADDR, INDEX, V1, SCALE) \
  __builtin_ia32_scattersiv2df ((void *) (ADDR), (__mmask8)0xFF, \
      (__v4si)(__m128i) (INDEX), \
      (__v2df)(__m128d) (V1), (int) (SCALE))

#define _mm_mask_i32scatter_pd(ADDR, MASK, INDEX, V1, SCALE) \
  __builtin_ia32_scattersiv2df ((void *) (ADDR), (__mmask8) (MASK), \
      (__v4si)(__m128i) (INDEX), \
      (__v2df)(__m128d) (V1), (int) (SCALE))
13304
/* i64scatter_ps macros.  All four view V1 as __v4sf.  The 256-bit-index
   pair calls __builtin_ia32_scatterdiv8sf with INDEX as __v4di; the
   128-bit-index pair calls __builtin_ia32_scatterdiv4sf with INDEX as
   __v2di.  ADDR is cast to void * and SCALE to int.  The unmasked forms
   pass the constant mask (__mmask8)0xFF; the `mask' forms pass MASK.  */
#define _mm256_i64scatter_ps(ADDR, INDEX, V1, SCALE) \
  __builtin_ia32_scatterdiv8sf ((void *) (ADDR), (__mmask8)0xFF, \
      (__v4di)(__m256i) (INDEX), \
      (__v4sf)(__m128) (V1), (int) (SCALE))

#define _mm256_mask_i64scatter_ps(ADDR, MASK, INDEX, V1, SCALE) \
  __builtin_ia32_scatterdiv8sf ((void *) (ADDR), (__mmask8) (MASK), \
      (__v4di)(__m256i) (INDEX), \
      (__v4sf)(__m128) (V1), (int) (SCALE))

#define _mm_i64scatter_ps(ADDR, INDEX, V1, SCALE) \
  __builtin_ia32_scatterdiv4sf ((void *) (ADDR), (__mmask8)0xFF, \
      (__v2di)(__m128i) (INDEX), \
      (__v4sf)(__m128) (V1), (int) (SCALE))

#define _mm_mask_i64scatter_ps(ADDR, MASK, INDEX, V1, SCALE) \
  __builtin_ia32_scatterdiv4sf ((void *) (ADDR), (__mmask8) (MASK), \
      (__v2di)(__m128i) (INDEX), \
      (__v4sf)(__m128) (V1), (int) (SCALE))
13324
/* i64scatter_pd macros.  The 256-bit pair calls
   __builtin_ia32_scatterdiv4df with INDEX as __v4di and V1 as __v4df;
   the 128-bit pair calls __builtin_ia32_scatterdiv2df with INDEX as
   __v2di and V1 as __v2df.  ADDR is cast to void * and SCALE to int.
   The unmasked forms pass the constant mask (__mmask8)0xFF; the `mask'
   forms pass MASK.  */
#define _mm256_i64scatter_pd(ADDR, INDEX, V1, SCALE) \
  __builtin_ia32_scatterdiv4df ((void *) (ADDR), (__mmask8)0xFF, \
      (__v4di)(__m256i) (INDEX), \
      (__v4df)(__m256d) (V1), (int) (SCALE))

#define _mm256_mask_i64scatter_pd(ADDR, MASK, INDEX, V1, SCALE) \
  __builtin_ia32_scatterdiv4df ((void *) (ADDR), (__mmask8) (MASK), \
      (__v4di)(__m256i) (INDEX), \
      (__v4df)(__m256d) (V1), (int) (SCALE))

#define _mm_i64scatter_pd(ADDR, INDEX, V1, SCALE) \
  __builtin_ia32_scatterdiv2df ((void *) (ADDR), (__mmask8)0xFF, \
      (__v2di)(__m128i) (INDEX), \
      (__v2df)(__m128d) (V1), (int) (SCALE))

#define _mm_mask_i64scatter_pd(ADDR, MASK, INDEX, V1, SCALE) \
  __builtin_ia32_scatterdiv2df ((void *) (ADDR), (__mmask8) (MASK), \
      (__v2di)(__m128i) (INDEX), \
      (__v2df)(__m128d) (V1), (int) (SCALE))
13344
/* i32scatter_epi32 macros.  The 256-bit pair calls
   __builtin_ia32_scattersiv8si with INDEX and V1 as __v8si; the 128-bit
   pair calls __builtin_ia32_scattersiv4si with INDEX and V1 as __v4si.
   ADDR is cast to void * and SCALE to int.  The unmasked forms pass the
   constant mask (__mmask8)0xFF; the `mask' forms pass MASK.  */
#define _mm256_i32scatter_epi32(ADDR, INDEX, V1, SCALE) \
  __builtin_ia32_scattersiv8si ((void *) (ADDR), (__mmask8)0xFF, \
      (__v8si)(__m256i) (INDEX), \
      (__v8si)(__m256i) (V1), (int) (SCALE))

#define _mm256_mask_i32scatter_epi32(ADDR, MASK, INDEX, V1, SCALE) \
  __builtin_ia32_scattersiv8si ((void *) (ADDR), (__mmask8) (MASK), \
      (__v8si)(__m256i) (INDEX), \
      (__v8si)(__m256i) (V1), (int) (SCALE))

#define _mm_i32scatter_epi32(ADDR, INDEX, V1, SCALE) \
  __builtin_ia32_scattersiv4si ((void *) (ADDR), (__mmask8)0xFF, \
      (__v4si)(__m128i) (INDEX), \
      (__v4si)(__m128i) (V1), (int) (SCALE))

#define _mm_mask_i32scatter_epi32(ADDR, MASK, INDEX, V1, SCALE) \
  __builtin_ia32_scattersiv4si ((void *) (ADDR), (__mmask8) (MASK), \
      (__v4si)(__m128i) (INDEX), \
      (__v4si)(__m128i) (V1), (int) (SCALE))
13364
/* i32scatter_epi64 macros.  The 256-bit pair calls
   __builtin_ia32_scattersiv4di with V1 as __v4di; the 128-bit pair calls
   __builtin_ia32_scattersiv2di with V1 as __v2di.  In all four, INDEX is
   a 128-bit vector viewed as __v4si, ADDR is cast to void * and SCALE to
   int.  The unmasked forms pass the constant mask (__mmask8)0xFF; the
   `mask' forms pass MASK.  */
#define _mm256_i32scatter_epi64(ADDR, INDEX, V1, SCALE) \
  __builtin_ia32_scattersiv4di ((void *) (ADDR), (__mmask8)0xFF, \
      (__v4si)(__m128i) (INDEX), \
      (__v4di)(__m256i) (V1), (int) (SCALE))

#define _mm256_mask_i32scatter_epi64(ADDR, MASK, INDEX, V1, SCALE) \
  __builtin_ia32_scattersiv4di ((void *) (ADDR), (__mmask8) (MASK), \
      (__v4si)(__m128i) (INDEX), \
      (__v4di)(__m256i) (V1), (int) (SCALE))

#define _mm_i32scatter_epi64(ADDR, INDEX, V1, SCALE) \
  __builtin_ia32_scattersiv2di ((void *) (ADDR), (__mmask8)0xFF, \
      (__v4si)(__m128i) (INDEX), \
      (__v2di)(__m128i) (V1), (int) (SCALE))

#define _mm_mask_i32scatter_epi64(ADDR, MASK, INDEX, V1, SCALE) \
  __builtin_ia32_scattersiv2di ((void *) (ADDR), (__mmask8) (MASK), \
      (__v4si)(__m128i) (INDEX), \
      (__v2di)(__m128i) (V1), (int) (SCALE))
13384
/* i64scatter_epi32 macros.  All four view V1 as __v4si.  The
   256-bit-index pair calls __builtin_ia32_scatterdiv8si with INDEX as
   __v4di; the 128-bit-index pair calls __builtin_ia32_scatterdiv4si with
   INDEX as __v2di.  ADDR is cast to void * and SCALE to int.  The
   unmasked forms pass the constant mask (__mmask8)0xFF; the `mask' forms
   pass MASK.  */
#define _mm256_i64scatter_epi32(ADDR, INDEX, V1, SCALE) \
  __builtin_ia32_scatterdiv8si ((void *) (ADDR), (__mmask8)0xFF, \
      (__v4di)(__m256i) (INDEX), \
      (__v4si)(__m128i) (V1), (int) (SCALE))

#define _mm256_mask_i64scatter_epi32(ADDR, MASK, INDEX, V1, SCALE) \
  __builtin_ia32_scatterdiv8si ((void *) (ADDR), (__mmask8) (MASK), \
      (__v4di)(__m256i) (INDEX), \
      (__v4si)(__m128i) (V1), (int) (SCALE))

#define _mm_i64scatter_epi32(ADDR, INDEX, V1, SCALE) \
  __builtin_ia32_scatterdiv4si ((void *) (ADDR), (__mmask8)0xFF, \
      (__v2di)(__m128i) (INDEX), \
      (__v4si)(__m128i) (V1), (int) (SCALE))

#define _mm_mask_i64scatter_epi32(ADDR, MASK, INDEX, V1, SCALE) \
  __builtin_ia32_scatterdiv4si ((void *) (ADDR), (__mmask8) (MASK), \
      (__v2di)(__m128i) (INDEX), \
      (__v4si)(__m128i) (V1), (int) (SCALE))
13404
/* i64scatter_epi64 wrappers.  The 256-bit forms call
   __builtin_ia32_scatterdiv4di with INDEX and V1 both cast to __v4di; the
   128-bit forms call __builtin_ia32_scatterdiv2di with both cast to
   __v2di.  ADDR is cast to void * and SCALE to int.  Unmasked forms pass
   (__mmask8)0xFF; _mask_ forms pass MASK.  */
13405#define _mm256_i64scatter_epi64(ADDR, INDEX, V1, SCALE) \
13406 __builtin_ia32_scatterdiv4di ((void *) (ADDR), (__mmask8)0xFF, \
13407 (__v4di)(__m256i) (INDEX), \
13408 (__v4di)(__m256i) (V1), (int) (SCALE))
13409
13410#define _mm256_mask_i64scatter_epi64(ADDR, MASK, INDEX, V1, SCALE) \
13411 __builtin_ia32_scatterdiv4di ((void *) (ADDR), (__mmask8) (MASK), \
13412 (__v4di)(__m256i) (INDEX), \
13413 (__v4di)(__m256i) (V1), (int) (SCALE))
13414
13415#define _mm_i64scatter_epi64(ADDR, INDEX, V1, SCALE) \
13416 __builtin_ia32_scatterdiv2di ((void *) (ADDR), (__mmask8)0xFF, \
13417 (__v2di)(__m128i) (INDEX), \
13418 (__v2di)(__m128i) (V1), (int) (SCALE))
13419
13420#define _mm_mask_i64scatter_epi64(ADDR, MASK, INDEX, V1, SCALE) \
13421 __builtin_ia32_scatterdiv2di ((void *) (ADDR), (__mmask8) (MASK), \
13422 (__v2di)(__m128i) (INDEX), \
13423 (__v2di)(__m128i) (V1), (int) (SCALE))
13424
/* Masked shuffle_epi32 wrappers around __builtin_ia32_pshufd256_mask and
   __builtin_ia32_pshufd128_mask.  Builtin arguments, in order: X cast to
   the vector type, C cast to int, a third vector operand, and U cast to
   __mmask8.  The _mask_ forms pass W as the third operand; the _maskz_
   forms pass an all-zero vector (_mm256_setzero_si256 () or
   _mm_setzero_si128 ()).  The result is cast to __m256i / __m128i.  */
13425#define _mm256_mask_shuffle_epi32(W, U, X, C) \
13426 ((__m256i) __builtin_ia32_pshufd256_mask ((__v8si)(__m256i)(X), (int)(C), \
13427 (__v8si)(__m256i)(W), \
13428 (__mmask8)(U)))
13429
13430#define _mm256_maskz_shuffle_epi32(U, X, C) \
13431 ((__m256i) __builtin_ia32_pshufd256_mask ((__v8si)(__m256i)(X), (int)(C), \
13432 (__v8si)(__m256i) \
13433 _mm256_setzero_si256 (), \
13434 (__mmask8)(U)))
13435
13436#define _mm_mask_shuffle_epi32(W, U, X, C) \
13437 ((__m128i) __builtin_ia32_pshufd128_mask ((__v4si)(__m128i)(X), (int)(C), \
13438 (__v4si)(__m128i)(W), \
13439 (__mmask8)(U)))
13440
13441#define _mm_maskz_shuffle_epi32(U, X, C) \
13442 ((__m128i) __builtin_ia32_pshufd128_mask ((__v4si)(__m128i)(X), (int)(C), \
13443 (__v4si)(__m128i)_mm_setzero_si128 (), \
13444 (__mmask8)(U)))
13445
/* rol_epi64 wrappers around __builtin_ia32_prolq256_mask and
   __builtin_ia32_prolq128_mask.  Builtin arguments, in order: A cast to
   __v4di / __v2di, B cast to int, a third vector operand, and an
   __mmask8.  Three variants per width:
     - plain:  zero vector as third operand, mask (__mmask8)-1;
     - _mask_: W as third operand, mask U;
     - _maskz_: zero vector as third operand, mask U.  */
13446#define _mm256_rol_epi64(A, B) \
13447 ((__m256i)__builtin_ia32_prolq256_mask ((__v4di)(__m256i)(A), (int)(B), \
13448 (__v4di)(__m256i)_mm256_setzero_si256 (),\
13449 (__mmask8)-1))
13450
13451#define _mm256_mask_rol_epi64(W, U, A, B) \
13452 ((__m256i)__builtin_ia32_prolq256_mask ((__v4di)(__m256i)(A), (int)(B), \
13453 (__v4di)(__m256i)(W), \
13454 (__mmask8)(U)))
13455
13456#define _mm256_maskz_rol_epi64(U, A, B) \
13457 ((__m256i)__builtin_ia32_prolq256_mask ((__v4di)(__m256i)(A), (int)(B), \
13458 (__v4di)(__m256i)_mm256_setzero_si256 (),\
13459 (__mmask8)(U)))
13460
13461#define _mm_rol_epi64(A, B) \
13462 ((__m128i)__builtin_ia32_prolq128_mask ((__v2di)(__m128i)(A), (int)(B), \
13463 (__v2di)(__m128i)_mm_setzero_si128 (),\
13464 (__mmask8)-1))
13465
13466#define _mm_mask_rol_epi64(W, U, A, B) \
13467 ((__m128i)__builtin_ia32_prolq128_mask ((__v2di)(__m128i)(A), (int)(B), \
13468 (__v2di)(__m128i)(W), \
13469 (__mmask8)(U)))
13470
13471#define _mm_maskz_rol_epi64(U, A, B) \
13472 ((__m128i)__builtin_ia32_prolq128_mask ((__v2di)(__m128i)(A), (int)(B), \
13473 (__v2di)(__m128i)_mm_setzero_si128 (),\
13474 (__mmask8)(U)))
13475
/* ror_epi64 wrappers around __builtin_ia32_prorq256_mask and
   __builtin_ia32_prorq128_mask.  Builtin arguments, in order: A cast to
   __v4di / __v2di, B cast to int, a third vector operand, and an
   __mmask8.  Three variants per width:
     - plain:  zero vector as third operand, mask (__mmask8)-1;
     - _mask_: W as third operand, mask U;
     - _maskz_: zero vector as third operand, mask U.  */
13476#define _mm256_ror_epi64(A, B) \
13477 ((__m256i)__builtin_ia32_prorq256_mask ((__v4di)(__m256i)(A), (int)(B), \
13478 (__v4di)(__m256i)_mm256_setzero_si256 (),\
13479 (__mmask8)-1))
13480
13481#define _mm256_mask_ror_epi64(W, U, A, B) \
13482 ((__m256i)__builtin_ia32_prorq256_mask ((__v4di)(__m256i)(A), (int)(B), \
13483 (__v4di)(__m256i)(W), \
13484 (__mmask8)(U)))
13485
13486#define _mm256_maskz_ror_epi64(U, A, B) \
13487 ((__m256i)__builtin_ia32_prorq256_mask ((__v4di)(__m256i)(A), (int)(B), \
13488 (__v4di)(__m256i)_mm256_setzero_si256 (),\
13489 (__mmask8)(U)))
13490
13491#define _mm_ror_epi64(A, B) \
13492 ((__m128i)__builtin_ia32_prorq128_mask ((__v2di)(__m128i)(A), (int)(B), \
13493 (__v2di)(__m128i)_mm_setzero_si128 (),\
13494 (__mmask8)-1))
13495
13496#define _mm_mask_ror_epi64(W, U, A, B) \
13497 ((__m128i)__builtin_ia32_prorq128_mask ((__v2di)(__m128i)(A), (int)(B), \
13498 (__v2di)(__m128i)(W), \
13499 (__mmask8)(U)))
13500
13501#define _mm_maskz_ror_epi64(U, A, B) \
13502 ((__m128i)__builtin_ia32_prorq128_mask ((__v2di)(__m128i)(A), (int)(B), \
13503 (__v2di)(__m128i)_mm_setzero_si128 (),\
13504 (__mmask8)(U)))
13505
/* rol_epi32 wrappers around __builtin_ia32_prold256_mask and
   __builtin_ia32_prold128_mask.  Builtin arguments, in order: A cast to
   __v8si / __v4si, B cast to int, a third vector operand, and an
   __mmask8.  Three variants per width:
     - plain:  zero vector as third operand, mask (__mmask8)-1;
     - _mask_: W as third operand, mask U;
     - _maskz_: zero vector as third operand, mask U.  */
13506#define _mm256_rol_epi32(A, B) \
13507 ((__m256i)__builtin_ia32_prold256_mask ((__v8si)(__m256i)(A), (int)(B), \
13508 (__v8si)(__m256i)_mm256_setzero_si256 (),\
13509 (__mmask8)-1))
13510
13511#define _mm256_mask_rol_epi32(W, U, A, B) \
13512 ((__m256i)__builtin_ia32_prold256_mask ((__v8si)(__m256i)(A), (int)(B), \
13513 (__v8si)(__m256i)(W), \
13514 (__mmask8)(U)))
13515
13516#define _mm256_maskz_rol_epi32(U, A, B) \
13517 ((__m256i)__builtin_ia32_prold256_mask ((__v8si)(__m256i)(A), (int)(B), \
13518 (__v8si)(__m256i)_mm256_setzero_si256 (),\
13519 (__mmask8)(U)))
13520
13521#define _mm_rol_epi32(A, B) \
13522 ((__m128i)__builtin_ia32_prold128_mask ((__v4si)(__m128i)(A), (int)(B), \
13523 (__v4si)(__m128i)_mm_setzero_si128 (),\
13524 (__mmask8)-1))
13525
13526#define _mm_mask_rol_epi32(W, U, A, B) \
13527 ((__m128i)__builtin_ia32_prold128_mask ((__v4si)(__m128i)(A), (int)(B), \
13528 (__v4si)(__m128i)(W), \
13529 (__mmask8)(U)))
13530
13531#define _mm_maskz_rol_epi32(U, A, B) \
13532 ((__m128i)__builtin_ia32_prold128_mask ((__v4si)(__m128i)(A), (int)(B), \
13533 (__v4si)(__m128i)_mm_setzero_si128 (),\
13534 (__mmask8)(U)))
13535
/* ror_epi32 wrappers around __builtin_ia32_prord256_mask and
   __builtin_ia32_prord128_mask.  Builtin arguments, in order: A cast to
   __v8si / __v4si, B cast to int, a third vector operand, and an
   __mmask8.  Three variants per width:
     - plain:  zero vector as third operand, mask (__mmask8)-1;
     - _mask_: W as third operand, mask U;
     - _maskz_: zero vector as third operand, mask U.  */
13536#define _mm256_ror_epi32(A, B) \
13537 ((__m256i)__builtin_ia32_prord256_mask ((__v8si)(__m256i)(A), (int)(B), \
13538 (__v8si)(__m256i)_mm256_setzero_si256 (),\
13539 (__mmask8)-1))
13540
13541#define _mm256_mask_ror_epi32(W, U, A, B) \
13542 ((__m256i)__builtin_ia32_prord256_mask ((__v8si)(__m256i)(A), (int)(B), \
13543 (__v8si)(__m256i)(W), \
13544 (__mmask8)(U)))
13545
13546#define _mm256_maskz_ror_epi32(U, A, B) \
13547 ((__m256i)__builtin_ia32_prord256_mask ((__v8si)(__m256i)(A), (int)(B), \
13548 (__v8si)(__m256i) \
13549 _mm256_setzero_si256 (), \
13550 (__mmask8)(U)))
13551
13552#define _mm_ror_epi32(A, B) \
13553 ((__m128i)__builtin_ia32_prord128_mask ((__v4si)(__m128i)(A), (int)(B), \
13554 (__v4si)(__m128i)_mm_setzero_si128 (),\
13555 (__mmask8)-1))
13556
13557#define _mm_mask_ror_epi32(W, U, A, B) \
13558 ((__m128i)__builtin_ia32_prord128_mask ((__v4si)(__m128i)(A), (int)(B), \
13559 (__v4si)(__m128i)(W), \
13560 (__mmask8)(U)))
13561
13562#define _mm_maskz_ror_epi32(U, A, B) \
13563 ((__m128i)__builtin_ia32_prord128_mask ((__v4si)(__m128i)(A), (int)(B), \
13564 (__v4si)(__m128i)_mm_setzero_si128 (),\
13565 (__mmask8)(U)))
13566
/* 256-bit alignr wrappers around __builtin_ia32_alignd256_mask (epi32)
   and __builtin_ia32_alignq256_mask (epi64).  Builtin arguments, in
   order: X, Y (both cast to __v8si / __v4di), C cast to int, a fourth
   vector operand, and an __mmask8.  Three variants per element width:
     - plain:  X reused as fourth operand, mask (__mmask8)-1;
     - _mask_: W as fourth operand, mask U;
     - _maskz_: _mm256_setzero_si256 () as fourth operand, mask U.  */
13567#define _mm256_alignr_epi32(X, Y, C) \
13568 ((__m256i)__builtin_ia32_alignd256_mask ((__v8si)(__m256i)(X), \
13569 (__v8si)(__m256i)(Y), (int)(C), (__v8si)(__m256i)(X), (__mmask8)-1))
13570
13571#define _mm256_mask_alignr_epi32(W, U, X, Y, C) \
13572 ((__m256i)__builtin_ia32_alignd256_mask ((__v8si)(__m256i)(X), \
13573 (__v8si)(__m256i)(Y), (int)(C), (__v8si)(__m256i)(W), (__mmask8)(U)))
13574
13575#define _mm256_maskz_alignr_epi32(U, X, Y, C) \
13576 ((__m256i)__builtin_ia32_alignd256_mask ((__v8si)(__m256i)(X), \
13577 (__v8si)(__m256i)(Y), (int)(C), (__v8si)(__m256i)_mm256_setzero_si256 (),\
13578 (__mmask8)(U)))
13579
13580#define _mm256_alignr_epi64(X, Y, C) \
13581 ((__m256i)__builtin_ia32_alignq256_mask ((__v4di)(__m256i)(X), \
13582 (__v4di)(__m256i)(Y), (int)(C), (__v4di)(__m256i)(X), (__mmask8)-1))
13583
13584#define _mm256_mask_alignr_epi64(W, U, X, Y, C) \
13585 ((__m256i)__builtin_ia32_alignq256_mask ((__v4di)(__m256i)(X), \
13586 (__v4di)(__m256i)(Y), (int)(C), (__v4di)(__m256i)(W), (__mmask8)(U)))
13587
13588#define _mm256_maskz_alignr_epi64(U, X, Y, C) \
13589 ((__m256i)__builtin_ia32_alignq256_mask ((__v4di)(__m256i)(X), \
13590 (__v4di)(__m256i)(Y), (int)(C), (__v4di)(__m256i)_mm256_setzero_si256 (),\
13591 (__mmask8)(U)))
13592
/* 128-bit alignr_epi32 wrappers around __builtin_ia32_alignd128_mask.
   Builtin arguments, in order: X, Y (both cast to __v4si), C cast to
   int, a fourth vector operand, and an __mmask8.
     - plain:  X reused as fourth operand, mask (__mmask8)-1;
     - _mask_: W as fourth operand, mask U;
     - _maskz_: _mm_setzero_si128 () as fourth operand, mask U.  */
13593#define _mm_alignr_epi32(X, Y, C) \
13594 ((__m128i)__builtin_ia32_alignd128_mask ((__v4si)(__m128i)(X), \
13595 (__v4si)(__m128i)(Y), (int)(C), (__v4si)(__m128i)(X), (__mmask8)-1))
13596
13597#define _mm_mask_alignr_epi32(W, U, X, Y, C) \
13598 ((__m128i)__builtin_ia32_alignd128_mask ((__v4si)(__m128i)(X), \
13599 (__v4si)(__m128i)(Y), (int)(C), (__v4si)(__m128i)(W), (__mmask8)(U)))
13600
13601#define _mm_maskz_alignr_epi32(U, X, Y, C) \
13602 ((__m128i)__builtin_ia32_alignd128_mask ((__v4si)(__m128i)(X), \
13603 (__v4si)(__m128i)(Y), (int)(C), (__v4si)(__m128i)_mm_setzero_si128 (),\
13604 (__mmask8)(U)))
13605
/* Unmasked 128-bit alignr_epi64: calls __builtin_ia32_alignq128_mask with
   X and Y cast to __v2di, C cast to int, X reused as the fourth vector
   operand and an all-ones mask, (__mmask8)-1.  */
13606#define _mm_alignr_epi64(X, Y, C) \
13607 ((__m128i)__builtin_ia32_alignq128_mask ((__v2di)(__m128i)(X), \
13608 (__v2di)(__m128i)(Y), (int)(C), (__v2di)(__m128i)(X), (__mmask8)-1))
13609
/* Masked 128-bit alignr_epi64: calls __builtin_ia32_alignq128_mask with
   X and Y cast to __v2di, C cast to int, W as the fourth vector operand
   and U as the __mmask8.  W and U must be forwarded (rather than X and
   an all-ones mask) so that this macro differs from the unmasked
   _mm_alignr_epi64 and matches the other _mask_alignr_* macros.  */
13610#define _mm_mask_alignr_epi64(W, U, X, Y, C) \
13611 ((__m128i)__builtin_ia32_alignq128_mask ((__v2di)(__m128i)(X), \
13612 (__v2di)(__m128i)(Y), (int)(C), (__v2di)(__m128i)(W), (__mmask8)(U)))
13613
/* maskz 128-bit alignr_epi64: calls __builtin_ia32_alignq128_mask with
   X and Y cast to __v2di, C cast to int, _mm_setzero_si128 () as the
   fourth vector operand and U as the __mmask8.  */
13614#define _mm_maskz_alignr_epi64(U, X, Y, C) \
13615 ((__m128i)__builtin_ia32_alignq128_mask ((__v2di)(__m128i)(X), \
13616 (__v2di)(__m128i)(Y), (int)(C), (__v2di)(__m128i)_mm_setzero_si128 (),\
13617 (__mmask8)(U)))
13618
/* Masked cvtps_ph wrappers around __builtin_ia32_vcvtps2ph_mask (A is a
   __m128, cast to __v4sf) and __builtin_ia32_vcvtps2ph256_mask (A is a
   __m256, cast to __v8sf).  Builtin arguments, in order: A, I cast to
   int, a __v8hi vector operand, and U cast to __mmask8.  The _mask_
   forms pass W as the __v8hi operand; the _maskz_ forms pass
   _mm_setzero_si128 ().  All four macros yield a __m128i, including the
   _mm256_ ones.  */
13619#define _mm_mask_cvtps_ph(W, U, A, I) \
13620 ((__m128i) __builtin_ia32_vcvtps2ph_mask ((__v4sf)(__m128) (A), (int) (I), \
13621 (__v8hi)(__m128i) (W), (__mmask8) (U)))
13622
13623#define _mm_maskz_cvtps_ph(U, A, I) \
13624 ((__m128i) __builtin_ia32_vcvtps2ph_mask ((__v4sf)(__m128) (A), (int) (I), \
13625 (__v8hi)(__m128i) _mm_setzero_si128 (), (__mmask8) (U)))
13626
13627#define _mm256_mask_cvtps_ph(W, U, A, I) \
13628 ((__m128i) __builtin_ia32_vcvtps2ph256_mask ((__v8sf)(__m256) (A), (int) (I), \
13629 (__v8hi)(__m128i) (W), (__mmask8) (U)))
13630
13631#define _mm256_maskz_cvtps_ph(U, A, I) \
13632 ((__m128i) __builtin_ia32_vcvtps2ph256_mask ((__v8sf)(__m256) (A), (int) (I), \
13633 (__v8hi)(__m128i) _mm_setzero_si128 (), (__mmask8) (U)))
13634
/* Masked srai_epi32 wrappers around __builtin_ia32_psradi256_mask and
   __builtin_ia32_psradi128_mask.  Builtin arguments, in order: A cast to
   __v8si / __v4si, B cast to int, a third vector operand, and U cast to
   __mmask8.  The _mask_ forms pass W as the third operand; the _maskz_
   forms pass a zero vector.  No unmasked form is defined in this
   group.  */
13635#define _mm256_mask_srai_epi32(W, U, A, B) \
13636 ((__m256i) __builtin_ia32_psradi256_mask ((__v8si)(__m256i)(A), \
13637 (int)(B), (__v8si)(__m256i)(W), (__mmask8)(U)))
13638
13639#define _mm256_maskz_srai_epi32(U, A, B) \
13640 ((__m256i) __builtin_ia32_psradi256_mask ((__v8si)(__m256i)(A), \
13641 (int)(B), (__v8si)_mm256_setzero_si256 (), (__mmask8)(U)))
13642
13643#define _mm_mask_srai_epi32(W, U, A, B) \
13644 ((__m128i) __builtin_ia32_psradi128_mask ((__v4si)(__m128i)(A), \
13645 (int)(B), (__v4si)(__m128i)(W), (__mmask8)(U)))
13646
13647#define _mm_maskz_srai_epi32(U, A, B) \
13648 ((__m128i) __builtin_ia32_psradi128_mask ((__v4si)(__m128i)(A), \
13649 (int)(B), (__v4si)_mm_setzero_si128 (), (__mmask8)(U)))
13650
/* srai_epi64 wrappers around __builtin_ia32_psraqi256_mask and
   __builtin_ia32_psraqi128_mask.  Builtin arguments, in order: A cast to
   __v4di / __v2di, B cast to int, a third vector operand, and an
   __mmask8.  Three variants per width:
     - plain:  zero vector as third operand, mask (__mmask8)-1;
     - _mask_: W as third operand, mask U;
     - _maskz_: zero vector as third operand, mask U.  */
13651#define _mm256_srai_epi64(A, B) \
13652 ((__m256i) __builtin_ia32_psraqi256_mask ((__v4di)(__m256i)(A), \
13653 (int)(B), (__v4di)_mm256_setzero_si256 (), (__mmask8)-1))
13654
13655#define _mm256_mask_srai_epi64(W, U, A, B) \
13656 ((__m256i) __builtin_ia32_psraqi256_mask ((__v4di)(__m256i)(A), \
13657 (int)(B), (__v4di)(__m256i)(W), (__mmask8)(U)))
13658
13659#define _mm256_maskz_srai_epi64(U, A, B) \
13660 ((__m256i) __builtin_ia32_psraqi256_mask ((__v4di)(__m256i)(A), \
13661 (int)(B), (__v4di)_mm256_setzero_si256 (), (__mmask8)(U)))
13662
13663#define _mm_srai_epi64(A, B) \
13664 ((__m128i) __builtin_ia32_psraqi128_mask ((__v2di)(__m128i)(A), \
13665 (int)(B), (__v2di)_mm_setzero_si128 (), (__mmask8)-1))
13666
13667#define _mm_mask_srai_epi64(W, U, A, B) \
13668 ((__m128i) __builtin_ia32_psraqi128_mask ((__v2di)(__m128i)(A), \
13669 (int)(B), (__v2di)(__m128i)(W), (__mmask8)(U)))
13670
13671#define _mm_maskz_srai_epi64(U, A, B) \
13672 ((__m128i) __builtin_ia32_psraqi128_mask ((__v2di)(__m128i)(A), \
13673 (int)(B), (__v2di)_mm_setzero_si128 (), (__mmask8)(U)))
13674
/* Masked permutex_pd wrappers around __builtin_ia32_permdf256_mask.
   Builtin arguments, in order: A cast to __v4df, B cast to int, a third
   __v4df operand, and U cast to __mmask8.  The _mask_ form passes W as
   the third operand; the _maskz_ form passes _mm256_setzero_pd ().  */
13675#define _mm256_mask_permutex_pd(W, U, A, B) \
13676 ((__m256d) __builtin_ia32_permdf256_mask ((__v4df)(__m256d)(A), \
13677 (int)(B), (__v4df)(__m256d)(W), (__mmask8)(U)))
13678
13679#define _mm256_maskz_permutex_pd(U, A, B) \
13680 ((__m256d) __builtin_ia32_permdf256_mask ((__v4df)(__m256d)(A), \
13681 (int)(B), (__v4df)(__m256d)_mm256_setzero_pd (), (__mmask8)(U)))
13682
/* Masked permute_pd / permute_ps wrappers.  Builtins used:
     __builtin_ia32_vpermilpd256_mask  (__v4df, 256-bit pd)
     __builtin_ia32_vpermilps256_mask  (__v8sf, 256-bit ps)
     __builtin_ia32_vpermilpd_mask     (__v2df, 128-bit pd)
     __builtin_ia32_vpermilps_mask     (__v4sf, 128-bit ps)
   Builtin arguments, in order: X cast to the vector type, C cast to int,
   a third vector operand, and U cast to __mmask8.  The _mask_ forms pass
   W as the third operand; the _maskz_ forms pass the matching
   *_setzero_pd () / *_setzero_ps () vector.  */
13683#define _mm256_mask_permute_pd(W, U, X, C) \
13684 ((__m256d) __builtin_ia32_vpermilpd256_mask ((__v4df)(__m256d)(X), (int)(C), \
13685 (__v4df)(__m256d)(W), \
13686 (__mmask8)(U)))
13687
13688#define _mm256_maskz_permute_pd(U, X, C) \
13689 ((__m256d) __builtin_ia32_vpermilpd256_mask ((__v4df)(__m256d)(X), (int)(C), \
13690 (__v4df)(__m256d)_mm256_setzero_pd (),\
13691 (__mmask8)(U)))
13692
13693#define _mm256_mask_permute_ps(W, U, X, C) \
13694 ((__m256) __builtin_ia32_vpermilps256_mask ((__v8sf)(__m256)(X), (int)(C), \
13695 (__v8sf)(__m256)(W), (__mmask8)(U)))
13696
13697#define _mm256_maskz_permute_ps(U, X, C) \
13698 ((__m256) __builtin_ia32_vpermilps256_mask ((__v8sf)(__m256)(X), (int)(C), \
13699 (__v8sf)(__m256)_mm256_setzero_ps (), \
13700 (__mmask8)(U)))
13701
13702#define _mm_mask_permute_pd(W, U, X, C) \
13703 ((__m128d) __builtin_ia32_vpermilpd_mask ((__v2df)(__m128d)(X), (int)(C), \
13704 (__v2df)(__m128d)(W), (__mmask8)(U)))
13705
13706#define _mm_maskz_permute_pd(U, X, C) \
13707 ((__m128d) __builtin_ia32_vpermilpd_mask ((__v2df)(__m128d)(X), (int)(C), \
13708 (__v2df)(__m128d)_mm_setzero_pd (), \
13709 (__mmask8)(U)))
13710
13711#define _mm_mask_permute_ps(W, U, X, C) \
13712 ((__m128) __builtin_ia32_vpermilps_mask ((__v4sf)(__m128)(X), (int)(C), \
13713 (__v4sf)(__m128)(W), (__mmask8)(U)))
13714
13715#define _mm_maskz_permute_ps(U, X, C) \
13716 ((__m128) __builtin_ia32_vpermilps_mask ((__v4sf)(__m128)(X), (int)(C), \
13717 (__v4sf)(__m128)_mm_setzero_ps (), \
13718 (__mmask8)(U)))
13719
/* mask_blend wrappers.  Each macro takes (__U, __A, __W) and calls the
   matching __builtin_ia32_blendm{pd,ps,q,d}_{256,128}_mask builtin with
   the arguments reordered as (__A, __W, __U): __A and __W are cast
   directly to the internal vector type (no intermediate __m256x/__m128x
   cast, unlike most macros in this file) and __U is cast to __mmask8.
   NOTE(review): which of __A / __W is selected for a set mask bit is
   decided by the builtin and cannot be read off this header -- confirm
   against the intrinsic documentation.  */
13720#define _mm256_mask_blend_pd(__U, __A, __W) \
13721 ((__m256d) __builtin_ia32_blendmpd_256_mask ((__v4df) (__A), \
13722 (__v4df) (__W), \
13723 (__mmask8) (__U)))
13724
13725#define _mm256_mask_blend_ps(__U, __A, __W) \
13726 ((__m256) __builtin_ia32_blendmps_256_mask ((__v8sf) (__A), \
13727 (__v8sf) (__W), \
13728 (__mmask8) (__U)))
13729
13730#define _mm256_mask_blend_epi64(__U, __A, __W) \
13731 ((__m256i) __builtin_ia32_blendmq_256_mask ((__v4di) (__A), \
13732 (__v4di) (__W), \
13733 (__mmask8) (__U)))
13734
13735#define _mm256_mask_blend_epi32(__U, __A, __W) \
13736 ((__m256i) __builtin_ia32_blendmd_256_mask ((__v8si) (__A), \
13737 (__v8si) (__W), \
13738 (__mmask8) (__U)))
13739
13740#define _mm_mask_blend_pd(__U, __A, __W) \
13741 ((__m128d) __builtin_ia32_blendmpd_128_mask ((__v2df) (__A), \
13742 (__v2df) (__W), \
13743 (__mmask8) (__U)))
13744
13745#define _mm_mask_blend_ps(__U, __A, __W) \
13746 ((__m128) __builtin_ia32_blendmps_128_mask ((__v4sf) (__A), \
13747 (__v4sf) (__W), \
13748 (__mmask8) (__U)))
13749
13750#define _mm_mask_blend_epi64(__U, __A, __W) \
13751 ((__m128i) __builtin_ia32_blendmq_128_mask ((__v2di) (__A), \
13752 (__v2di) (__W), \
13753 (__mmask8) (__U)))
13754
13755#define _mm_mask_blend_epi32(__U, __A, __W) \
13756 ((__m128i) __builtin_ia32_blendmd_128_mask ((__v4si) (__A), \
13757 (__v4si) (__W), \
13758 (__mmask8) (__U)))
13759
/* Unmasked 256-bit compare-to-mask wrappers.  Each macro calls the
   matching builtin (ucmpd256 / cmpq256 / cmpd256 / ucmpq256 / cmppd256 /
   cmpps256 _mask) with X and Y cast to the element-appropriate vector
   type, P cast to int, and an all-ones input mask, (__mmask8)-1.  The
   result is cast to __mmask8.  The epu32/epu64 forms use the same
   __v8si / __v4di casts as the epi forms; only the builtin (ucmp*
   vs. cmp*) differs.  */
13760#define _mm256_cmp_epu32_mask(X, Y, P) \
13761 ((__mmask8) __builtin_ia32_ucmpd256_mask ((__v8si)(__m256i)(X), \
13762 (__v8si)(__m256i)(Y), (int)(P),\
13763 (__mmask8)-1))
13764
13765#define _mm256_cmp_epi64_mask(X, Y, P) \
13766 ((__mmask8) __builtin_ia32_cmpq256_mask ((__v4di)(__m256i)(X), \
13767 (__v4di)(__m256i)(Y), (int)(P),\
13768 (__mmask8)-1))
13769
13770#define _mm256_cmp_epi32_mask(X, Y, P) \
13771 ((__mmask8) __builtin_ia32_cmpd256_mask ((__v8si)(__m256i)(X), \
13772 (__v8si)(__m256i)(Y), (int)(P),\
13773 (__mmask8)-1))
13774
13775#define _mm256_cmp_epu64_mask(X, Y, P) \
13776 ((__mmask8) __builtin_ia32_ucmpq256_mask ((__v4di)(__m256i)(X), \
13777 (__v4di)(__m256i)(Y), (int)(P),\
13778 (__mmask8)-1))
13779
13780#define _mm256_cmp_pd_mask(X, Y, P) \
13781 ((__mmask8) __builtin_ia32_cmppd256_mask ((__v4df)(__m256d)(X), \
13782 (__v4df)(__m256d)(Y), (int)(P),\
13783 (__mmask8)-1))
13784
13785#define _mm256_cmp_ps_mask(X, Y, P) \
13786 ((__mmask8) __builtin_ia32_cmpps256_mask ((__v8sf)(__m256)(X), \
13787 (__v8sf)(__m256)(Y), (int)(P),\
13788 (__mmask8)-1))
13789
/* Masked 256-bit compare-to-mask wrappers.  Same builtins and casts as
   the unmasked _mm256_cmp_*_mask macros, but the caller-supplied M (cast
   to __mmask8) is passed as the builtin's final mask argument instead of
   (__mmask8)-1.  The result is cast to __mmask8.  */
13790#define _mm256_mask_cmp_epi64_mask(M, X, Y, P) \
13791 ((__mmask8) __builtin_ia32_cmpq256_mask ((__v4di)(__m256i)(X), \
13792 (__v4di)(__m256i)(Y), (int)(P),\
13793 (__mmask8)(M)))
13794
13795#define _mm256_mask_cmp_epi32_mask(M, X, Y, P) \
13796 ((__mmask8) __builtin_ia32_cmpd256_mask ((__v8si)(__m256i)(X), \
13797 (__v8si)(__m256i)(Y), (int)(P),\
13798 (__mmask8)(M)))
13799
13800#define _mm256_mask_cmp_epu64_mask(M, X, Y, P) \
13801 ((__mmask8) __builtin_ia32_ucmpq256_mask ((__v4di)(__m256i)(X), \
13802 (__v4di)(__m256i)(Y), (int)(P),\
13803 (__mmask8)(M)))
13804
13805#define _mm256_mask_cmp_epu32_mask(M, X, Y, P) \
13806 ((__mmask8) __builtin_ia32_ucmpd256_mask ((__v8si)(__m256i)(X), \
13807 (__v8si)(__m256i)(Y), (int)(P),\
13808 (__mmask8)(M)))
13809
13810#define _mm256_mask_cmp_pd_mask(M, X, Y, P) \
13811 ((__mmask8) __builtin_ia32_cmppd256_mask ((__v4df)(__m256d)(X), \
13812 (__v4df)(__m256d)(Y), (int)(P),\
13813 (__mmask8)(M)))
13814
13815#define _mm256_mask_cmp_ps_mask(M, X, Y, P) \
13816 ((__mmask8) __builtin_ia32_cmpps256_mask ((__v8sf)(__m256)(X), \
13817 (__v8sf)(__m256)(Y), (int)(P),\
13818 (__mmask8)(M)))
13819
/* Unmasked 128-bit compare-to-mask wrappers.  Each macro calls the
   matching builtin (cmpq128 / cmpd128 / ucmpq128 / ucmpd128 / cmppd128 /
   cmpps128 _mask) with X and Y cast to the element-appropriate 128-bit
   vector type, P cast to int, and an all-ones input mask, (__mmask8)-1.
   The result is cast to __mmask8.  */
13820#define _mm_cmp_epi64_mask(X, Y, P) \
13821 ((__mmask8) __builtin_ia32_cmpq128_mask ((__v2di)(__m128i)(X), \
13822 (__v2di)(__m128i)(Y), (int)(P),\
13823 (__mmask8)-1))
13824
13825#define _mm_cmp_epi32_mask(X, Y, P) \
13826 ((__mmask8) __builtin_ia32_cmpd128_mask ((__v4si)(__m128i)(X), \
13827 (__v4si)(__m128i)(Y), (int)(P),\
13828 (__mmask8)-1))
13829
13830#define _mm_cmp_epu64_mask(X, Y, P) \
13831 ((__mmask8) __builtin_ia32_ucmpq128_mask ((__v2di)(__m128i)(X), \
13832 (__v2di)(__m128i)(Y), (int)(P),\
13833 (__mmask8)-1))
13834
13835#define _mm_cmp_epu32_mask(X, Y, P) \
13836 ((__mmask8) __builtin_ia32_ucmpd128_mask ((__v4si)(__m128i)(X), \
13837 (__v4si)(__m128i)(Y), (int)(P),\
13838 (__mmask8)-1))
13839
13840#define _mm_cmp_pd_mask(X, Y, P) \
13841 ((__mmask8) __builtin_ia32_cmppd128_mask ((__v2df)(__m128d)(X), \
13842 (__v2df)(__m128d)(Y), (int)(P),\
13843 (__mmask8)-1))
13844
13845#define _mm_cmp_ps_mask(X, Y, P) \
13846 ((__mmask8) __builtin_ia32_cmpps128_mask ((__v4sf)(__m128)(X), \
13847 (__v4sf)(__m128)(Y), (int)(P),\
13848 (__mmask8)-1))
13849
/* Masked 128-bit compare-to-mask wrappers.  Same builtins and casts as
   the unmasked _mm_cmp_*_mask macros, but the caller-supplied M (cast to
   __mmask8) is passed as the builtin's final mask argument instead of
   (__mmask8)-1.  The result is cast to __mmask8.  */
13850#define _mm_mask_cmp_epi64_mask(M, X, Y, P) \
13851 ((__mmask8) __builtin_ia32_cmpq128_mask ((__v2di)(__m128i)(X), \
13852 (__v2di)(__m128i)(Y), (int)(P),\
13853 (__mmask8)(M)))
13854
13855#define _mm_mask_cmp_epi32_mask(M, X, Y, P) \
13856 ((__mmask8) __builtin_ia32_cmpd128_mask ((__v4si)(__m128i)(X), \
13857 (__v4si)(__m128i)(Y), (int)(P),\
13858 (__mmask8)(M)))
13859
13860#define _mm_mask_cmp_epu64_mask(M, X, Y, P) \
13861 ((__mmask8) __builtin_ia32_ucmpq128_mask ((__v2di)(__m128i)(X), \
13862 (__v2di)(__m128i)(Y), (int)(P),\
13863 (__mmask8)(M)))
13864
13865#define _mm_mask_cmp_epu32_mask(M, X, Y, P) \
13866 ((__mmask8) __builtin_ia32_ucmpd128_mask ((__v4si)(__m128i)(X), \
13867 (__v4si)(__m128i)(Y), (int)(P),\
13868 (__mmask8)(M)))
13869
13870#define _mm_mask_cmp_pd_mask(M, X, Y, P) \
13871 ((__mmask8) __builtin_ia32_cmppd128_mask ((__v2df)(__m128d)(X), \
13872 (__v2df)(__m128d)(Y), (int)(P),\
13873 (__mmask8)(M)))
13874
13875#define _mm_mask_cmp_ps_mask(M, X, Y, P) \
13876 ((__mmask8) __builtin_ia32_cmpps128_mask ((__v4sf)(__m128)(X), \
13877 (__v4sf)(__m128)(Y), (int)(P),\
13878 (__mmask8)(M)))
13879
13880#endif
13881
/* Alias macros that forward to other intrinsics.
   _mm256_permutexvar_ps (A, B) forwards to _mm256_permutevar8x32_ps with
   the two arguments swapped, i.e. (B), (A).
   The *_cvt_roundps_ph macros forward every argument, unchanged and in
   the same order, to the corresponding *_cvtps_ph macro.  */
13882#define _mm256_permutexvar_ps(A, B) _mm256_permutevar8x32_ps ((B), (A))
13883#define _mm256_mask_cvt_roundps_ph(A, B, C, D) \
13884 _mm256_mask_cvtps_ph ((A), (B), (C), (D))
13885#define _mm256_maskz_cvt_roundps_ph(A, B, C) \
13886 _mm256_maskz_cvtps_ph ((A), (B), (C))
13887#define _mm_mask_cvt_roundps_ph(A, B, C, D) \
13888 _mm_mask_cvtps_ph ((A), (B), (C), (D))
13889#define _mm_maskz_cvt_roundps_ph(A, B, C) _mm_maskz_cvtps_ph ((A), (B), (C))
13890
/* Undo the target override made at the top of this header: when
   __AVX512VL__ was not defined there, the header pushed the option state,
   selected target("avx512vl") and defined __DISABLE_AVX512VL__ as a
   marker.  If the marker is set, clear it and pop the saved options.  */
13891#ifdef __DISABLE_AVX512VL__
13892#undef __DISABLE_AVX512VL__
13893#pragma GCC pop_options
13894#endif /* __DISABLE_AVX512VL__ */
13895
13896#endif /* _AVX512VLINTRIN_H_INCLUDED */
unsigned char __mmask8
unsigned short __mmask16
_MM_MANTISSA_NORM_ENUM
_MM_MANTISSA_SIGN_ENUM
__inline __m512i int int int int int int int int int int int int int int __O
_MM_PERM_ENUM
__inline __m512d __m512d __m512d __W
#define _mm256_mmask_i64gather_pd(V1OLD, MASK, INDEX, ADDR, SCALE)
#define _mm_mask_roundscale_pd(W, U, A, B)
#define _mm256_mask_cmp_pd_mask(M, X, Y, P)
#define _mm_i32scatter_pd(ADDR, INDEX, V1, SCALE)
#define _mm_i32scatter_ps(ADDR, INDEX, V1, SCALE)
#define _mm_mask_i32scatter_epi32(ADDR, MASK, INDEX, V1, SCALE)
#define _mm_mmask_i32gather_epi32(V1OLD, MASK, INDEX, ADDR, SCALE)
#define _mm_mask_cmp_epu64_mask(M, X, Y, P)
#define _mm256_maskz_ror_epi64(U, A, B)
#define _mm256_mask_permute_pd(W, U, X, C)
#define _mm256_shuffle_i32x4(X, Y, C)
#define _mm_mask_ror_epi64(W, U, A, B)
#define _mm256_mask_i32scatter_pd(ADDR, MASK, INDEX, V1, SCALE)
#define _mm_mask_srai_epi32(W, U, A, B)
#define _mm256_mask_blend_ps(__U, __A, __W)
#define _mm_mask_shuffle_epi32(W, U, X, C)
#define _mm_srai_epi64(A, B)
#define _mm_i64scatter_ps(ADDR, INDEX, V1, SCALE)
#define _mm256_roundscale_pd(A, B)
#define _mm_roundscale_pd(A, B)
#define _mm256_maskz_ternarylogic_epi32(U, A, B, C, I)
#define _mm256_getmant_ps(X, B, C)
#define _mm256_i32scatter_epi64(ADDR, INDEX, V1, SCALE)
#define _mm256_maskz_shuffle_ps(U, A, B, C)
__inline __m256i __mmask8 __m128i __X
#define _mm_alignr_epi64(X, Y, C)
#define _mm256_i32scatter_ps(ADDR, INDEX, V1, SCALE)
#define _mm_cmp_epu32_mask(X, Y, P)
#define _mm256_mmask_i32gather_ps(V1OLD, MASK, INDEX, ADDR, SCALE)
#define _mm256_getmant_pd(X, B, C)
#define _mm_mask_i64scatter_epi32(ADDR, MASK, INDEX, V1, SCALE)
#define _mm_mask_i32scatter_pd(ADDR, MASK, INDEX, V1, SCALE)
#define _mm_maskz_fixupimm_pd(U, X, Y, Z, C)
#define _mm_mask_permute_ps(W, U, X, C)
#define _mm256_maskz_srai_epi64(U, A, B)
#define _mm_maskz_alignr_epi32(U, X, Y, C)
#define _mm_maskz_rol_epi64(U, A, B)
#define _mm256_maskz_permute_ps(U, X, C)
#define _mm256_mask_getmant_pd(W, U, X, B, C)
#define _mm256_maskz_shuffle_f64x2(U, X, Y, C)
#define _mm_mask_shuffle_ps(W, U, A, B, C)
#define _mm256_mask_permutex_epi64(W, M, X, I)
#define _mm256_mask_srli_epi32(W, U, A, B)
#define _mm256_alignr_epi32(X, Y, C)
#define _mm256_maskz_fixupimm_pd(U, X, Y, Z, C)
#define _mm256_maskz_permutex_epi64(M, X, I)
#define _mm_mask_i64scatter_epi64(ADDR, MASK, INDEX, V1, SCALE)
#define _mm256_mask_fixupimm_pd(X, U, Y, Z, C)
#define _mm256_permutex_epi64(X, I)
#define _mm_mmask_i32gather_pd(V1OLD, MASK, INDEX, ADDR, SCALE)
#define _mm256_mask_insertf32x4(W, U, X, Y, C)
#define _mm_maskz_ternarylogic_epi64(U, A, B, C, I)
#define _mm_cmp_ps_mask(X, Y, P)
#define _mm_cmp_epi32_mask(X, Y, P)
#define _mm_mask_getmant_ps(W, U, X, B, C)
#define _mm256_mask_srli_epi64(W, U, A, B)
#define _mm256_maskz_slli_epi64(U, X, C)
#define _mm_mask_cvtps_ph(W, U, A, I)
#define _mm256_maskz_roundscale_pd(U, A, B)
#define _mm_mmask_i64gather_ps(V1OLD, MASK, INDEX, ADDR, SCALE)
#define _mm256_shuffle_i64x2(X, Y, C)
#define _mm256_mask_i64scatter_epi64(ADDR, MASK, INDEX, V1, SCALE)
#define _mm256_mmask_i32gather_epi64(V1OLD, MASK, INDEX, ADDR, SCALE)
#define _mm256_maskz_cvtps_ph(U, A, I)
#define _mm256_shuffle_f32x4(X, Y, C)
#define _mm_mask_cmp_ps_mask(M, X, Y, P)
#define _mm256_i64scatter_epi32(ADDR, INDEX, V1, SCALE)
#define _mm256_maskz_rol_epi32(U, A, B)
#define _mm256_mask_blend_pd(__U, __A, __W)
#define _mm256_mask_cmp_ps_mask(M, X, Y, P)
#define _mm256_mask_cmp_epu64_mask(M, X, Y, P)
#define _mm256_maskz_shuffle_i32x4(U, X, Y, C)
#define _mm256_maskz_getmant_pd(U, X, B, C)
#define _mm_i64scatter_epi64(ADDR, INDEX, V1, SCALE)
#define _mm_maskz_srli_epi32(U, A, B)
#define _mm_mmask_i32gather_ps(V1OLD, MASK, INDEX, ADDR, SCALE)
#define _mm_maskz_roundscale_pd(U, A, B)
#define _mm_mask_rol_epi64(W, U, A, B)
#define _mm_mask_blend_ps(__U, __A, __W)
#define _mm256_maskz_shuffle_epi32(U, X, C)
#define _mm256_cmp_epu32_mask(X, Y, P)
#define _mm_fixupimm_pd(X, Y, Z, C)
#define _mm_mask_permute_pd(W, U, X, C)
#define _mm256_maskz_slli_epi32(U, X, C)
#define _mm256_rol_epi64(A, B)
#define _mm256_cmp_epi64_mask(X, Y, P)
#define _mm_mmask_i64gather_epi32(V1OLD, MASK, INDEX, ADDR, SCALE)
#define _mm_ror_epi32(A, B)
__inline __m128d __mmask8 __m128d __m128d __B
#define _mm_maskz_srai_epi32(U, A, B)
#define _mm256_mask_i64scatter_ps(ADDR, MASK, INDEX, V1, SCALE)
#define _mm_mask_i32scatter_epi64(ADDR, MASK, INDEX, V1, SCALE)
#define _mm256_mask_srai_epi32(W, U, A, B)
#define _mm256_permutex_pd(X, M)
#define _mm256_mask_i32scatter_ps(ADDR, MASK, INDEX, V1, SCALE)
#define _mm_maskz_ror_epi32(U, A, B)
#define _mm256_mask_slli_epi64(W, U, X, C)
#define _mm_mmask_i64gather_pd(V1OLD, MASK, INDEX, ADDR, SCALE)
#define _mm256_insertf32x4(X, Y, C)
#define _mm256_maskz_ternarylogic_epi64(U, A, B, C, I)
#define _mm_mask_roundscale_ps(W, U, A, B)
#define _mm256_maskz_insertf32x4(U, X, Y, C)
#define _mm256_mask_i64scatter_pd(ADDR, MASK, INDEX, V1, SCALE)
#define _mm_mask_slli_epi64(W, U, X, C)
#define _mm_mask_cmp_epu32_mask(M, X, Y, P)
#define _mm256_mask_shuffle_i32x4(W, U, X, Y, C)
#define _mm256_maskz_permutex_pd(U, A, B)
#define _mm256_mmask_i32gather_epi32(V1OLD, MASK, INDEX, ADDR, SCALE)
#define _mm256_rol_epi32(A, B)
#define _mm_mask_blend_pd(__U, __A, __W)
#define _mm_fixupimm_ps(X, Y, Z, C)
#define _mm_cmp_epi64_mask(X, Y, P)
#define _mm256_mask_ternarylogic_epi64(A, U, B, C, I)
#define _mm256_alignr_epi64(X, Y, C)
#define _mm_maskz_rol_epi32(U, A, B)
#define _mm_mask_srli_epi64(W, U, A, B)
#define _mm256_maskz_shuffle_i64x2(U, X, Y, C)
#define _mm256_maskz_roundscale_ps(U, A, B)
#define _mm_roundscale_ps(A, B)
#define _mm_ternarylogic_epi64(A, B, C, I)
#define _mm256_mask_shuffle_ps(W, U, A, B, C)
#define _mm256_ror_epi64(A, B)
#define _mm256_roundscale_ps(A, B)
#define _mm256_shuffle_f64x2(X, Y, C)
#define _mm256_mask_alignr_epi32(W, U, X, Y, C)
#define _mm_mmask_i32gather_epi64(V1OLD, MASK, INDEX, ADDR, SCALE)
#define _mm_mask_fixupimm_pd(X, U, Y, Z, C)
#define _mm256_mask_rol_epi64(W, U, A, B)
#define _mm256_maskz_ror_epi32(U, A, B)
#define _mm_getmant_pd(X, B, C)
#define _mm256_ror_epi32(A, B)
#define _mm256_maskz_alignr_epi64(U, X, Y, C)
#define _mm_rol_epi64(A, B)
#define _mm256_inserti32x4(X, Y, C)
#define _mm_i64scatter_epi32(ADDR, INDEX, V1, SCALE)
__inline __m256d __mmask8 __U
#define _mm256_mask_fixupimm_ps(X, U, Y, Z, C)
#define _mm_mask_cmp_epi32_mask(M, X, Y, P)
#define _mm256_mask_shuffle_f64x2(W, U, X, Y, C)
#define _mm256_maskz_shuffle_pd(U, A, B, C)
#define _mm256_mask_blend_epi64(__U, __A, __W)
#define _mm_cmp_pd_mask(X, Y, P)
#define _mm256_mask_roundscale_ps(W, U, A, B)
#define _mm256_mask_getmant_ps(W, U, X, B, C)
#define _mm_mask_ror_epi32(W, U, A, B)
#define _mm256_maskz_extracti32x4_epi32(U, X, C)
#define _mm_ror_epi64(A, B)
#define _mm256_mask_shuffle_pd(W, U, A, B, C)
__inline __m256d __mmask8 void const * __P
__inline void __mmask8 __M
#define _mm_mask_fixupimm_ps(X, U, Y, Z, C)
#define _mm256_fixupimm_pd(X, Y, Z, C)
#define _mm_maskz_ternarylogic_epi32(U, A, B, C, I)
#define _mm256_mask_inserti32x4(W, U, X, Y, C)
__inline __m256d __mmask8 __m256d __m256d __C
#define _mm_maskz_fixupimm_ps(U, X, Y, Z, C)
#define _mm256_mmask_i64gather_ps(V1OLD, MASK, INDEX, ADDR, SCALE)
#define _mm256_mask_cmp_epi32_mask(M, X, Y, P)
#define _mm_maskz_shuffle_epi32(U, X, C)
#define _mm_maskz_slli_epi32(U, X, C)
#define _mm256_mask_cmp_epi64_mask(M, X, Y, P)
#define _mm_mask_getmant_pd(W, U, X, B, C)
#define _mm_getmant_ps(X, B, C)
#define _mm256_ternarylogic_epi64(A, B, C, I)
#define _mm256_maskz_srli_epi32(U, A, B)
#define _mm_mask_i32scatter_ps(ADDR, MASK, INDEX, V1, SCALE)
#define _mm256_maskz_shuffle_f32x4(U, X, Y, C)
#define _mm256_ternarylogic_epi32(A, B, C, I)
#define _mm_mask_cmp_epi64_mask(M, X, Y, P)
#define _mm256_mask_srai_epi64(W, U, A, B)
#define _mm_mask_i64scatter_pd(ADDR, MASK, INDEX, V1, SCALE)
#define _mm256_i64scatter_epi64(ADDR, INDEX, V1, SCALE)
#define _mm256_mask_cvtps_ph(W, U, A, I)
#define _mm256_mask_shuffle_f32x4(W, U, X, Y, C)
#define _mm_maskz_permute_ps(U, X, C)
#define _mm_mask_ternarylogic_epi64(A, U, B, C, I)
#define _mm_mask_ternarylogic_epi32(A, U, B, C, I)
#define _mm256_fixupimm_ps(X, Y, Z, C)
#define _mm_mask_rol_epi32(W, U, A, B)
#define _mm_maskz_shuffle_ps(U, A, B, C)
#define _mm256_mmask_i64gather_epi64(V1OLD, MASK, INDEX, ADDR, SCALE)
#define _mm256_maskz_fixupimm_ps(U, X, Y, Z, C)
#define _mm256_maskz_srai_epi32(U, A, B)
#define _mm_mask_slli_epi32(W, U, X, C)
#define _mm_maskz_alignr_epi64(U, X, Y, C)
#define _mm256_maskz_inserti32x4(U, X, Y, C)
#define _mm_i64scatter_pd(ADDR, INDEX, V1, SCALE)
#define _mm_maskz_shuffle_pd(U, A, B, C)
#define _mm_mmask_i64gather_epi64(V1OLD, MASK, INDEX, ADDR, SCALE)
#define _mm_maskz_getmant_ps(U, X, B, C)
#define _mm_i32scatter_epi64(ADDR, INDEX, V1, SCALE)
#define _mm256_cmp_epi32_mask(X, Y, P)
#define _mm256_mask_extractf32x4_ps(W, U, X, C)
#define _mm256_maskz_alignr_epi32(U, X, Y, C)
#define _mm256_mask_blend_epi32(__U, __A, __W)
#define _mm256_mask_i32scatter_epi64(ADDR, MASK, INDEX, V1, SCALE)
#define _mm256_maskz_srli_epi64(U, A, B)
#define _mm256_maskz_getmant_ps(U, X, B, C)
#define _mm256_maskz_permute_pd(U, X, C)
#define _mm256_mmask_i32gather_pd(V1OLD, MASK, INDEX, ADDR, SCALE)
#define _mm256_cmp_epu64_mask(X, Y, P)
#define _mm256_mask_permutex_pd(W, U, A, B)
#define _mm256_i32scatter_epi32(ADDR, INDEX, V1, SCALE)
#define _mm256_i64scatter_ps(ADDR, INDEX, V1, SCALE)
#define _mm_maskz_permute_pd(U, X, C)
__inline __m128i __m128i __Y
#define _mm256_mask_i32scatter_epi32(ADDR, MASK, INDEX, V1, SCALE)
#define _mm_alignr_epi32(X, Y, C)
#define _mm256_mask_ror_epi64(W, U, A, B)
#define _mm256_mask_roundscale_pd(W, U, A, B)
#define _mm256_srai_epi64(A, B)
#define _mm256_mask_extracti32x4_epi32(W, U, X, C)
#define _mm256_mask_permute_ps(W, U, X, C)
#define _mm256_mask_shuffle_epi32(W, U, X, C)
#define _mm256_maskz_extractf32x4_ps(U, X, C)
#define _mm_maskz_getmant_pd(U, X, B, C)
#define _mm256_mask_shuffle_i64x2(W, U, X, Y, C)
#define _mm_mask_alignr_epi64(W, U, X, Y, C)
unsigned int __mmask32
#define _mm_i32scatter_epi32(ADDR, INDEX, V1, SCALE)
#define _mm256_mask_slli_epi32(W, U, X, C)
#define _mm256_mask_ternarylogic_epi32(A, U, B, C, I)
#define _mm256_mmask_i64gather_epi32(V1OLD, MASK, INDEX, ADDR, SCALE)
__inline __m256d __m256i __I
#define _mm256_mask_alignr_epi64(W, U, X, Y, C)
#define _mm256_cmp_ps_mask(X, Y, P)
#define _mm256_i32scatter_pd(ADDR, INDEX, V1, SCALE)
#define _mm256_extracti32x4_epi32(X, C)
__inline __m256d __mmask8 __m256d __A
#define _mm256_i64scatter_pd(ADDR, INDEX, V1, SCALE)
#define _mm_mask_srai_epi64(W, U, A, B)
#define _mm256_maskz_rol_epi64(U, A, B)
#define _mm_mask_i64scatter_ps(ADDR, MASK, INDEX, V1, SCALE)
#define _mm256_mask_i64scatter_epi32(ADDR, MASK, INDEX, V1, SCALE)
#define _mm_mask_alignr_epi32(W, U, X, Y, C)
#define _mm_ternarylogic_epi32(A, B, C, I)
#define _mm_maskz_roundscale_ps(U, A, B)
#define _mm256_extractf32x4_ps(X, C)
#define _mm_mask_blend_epi32(__U, __A, __W)
#define _mm_mask_cmp_pd_mask(M, X, Y, P)
#define _mm_maskz_srai_epi64(U, A, B)
#define _mm256_mask_ror_epi32(W, U, A, B)
#define _mm256_mask_cmp_epu32_mask(M, X, Y, P)
#define _mm_mask_blend_epi64(__U, __A, __W)
int __v4si_u __attribute__((__vector_size__(16), __may_alias__, __aligned__(1)))
#define _mm_maskz_cvtps_ph(U, A, I)
#define _mm256_cmp_pd_mask(X, Y, P)
#define _mm_mask_shuffle_pd(W, U, A, B, C)
#define _mm256_mask_rol_epi32(W, U, A, B)
#define _mm_maskz_slli_epi64(U, X, C)
#define _mm_maskz_ror_epi64(U, A, B)
#define _mm_mask_srli_epi32(W, U, A, B)
#define _mm_maskz_srli_epi64(U, A, B)
#define _mm_rol_epi32(A, B)
#define _mm_cmp_epu64_mask(X, Y, P)
GLintptr offset
Definition gl2ext.h:1470